diff --git a/COPYING b/COPYING index 1f3e6505..782c7bb6 100644 --- a/COPYING +++ b/COPYING @@ -1,14 +1,14 @@ -Copyright (c) 2014 The MatConvNet team. +Copyright (c) 2014-16 The MatConvNet Team. All rights reserved. Redistribution and use in source and binary forms are permitted provided that the above copyright notice and this paragraph are -duplicated in all such forms and that any documentation, -advertising materials, and other materials related to such -distribution and use acknowledge that the software was developed -by the . The name of the - may not be used to endorse or promote products derived -from this software without specific prior written permission. -THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR -IMPLIED WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED -WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. \ No newline at end of file +duplicated in all such forms and that any documentation, advertising +materials, and other materials related to such distribution and use +acknowledge that the software was developed by the MatConvNet +Team. The name of the MatConvNet Team may not be used to endorse or +promote products derived from this software without specific prior +written permission. THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT +ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE +IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR +PURPOSE. \ No newline at end of file diff --git a/Makefile b/Makefile index 165729a7..246d8bda 100644 --- a/Makefile +++ b/Makefile @@ -20,10 +20,10 @@ DEBUG ?= ARCH ?= maci64 # Configure MATLAB -MATLABROOT ?= /Applications/MATLAB_R2015a.app +MATLABROOT ?= /Applications/MATLAB_R2017a.app # Configure CUDA and CuDNN. CUDAMETHOD can be either 'nvcc' or 'mex'. 
-CUDAROOT ?= /Developer/NVIDIA/CUDA-6.5 +CUDAROOT ?= /Developer/NVIDIA/CUDA-8.0 CUDNNROOT ?= $(CURDIR)/local/ CUDAMETHOD ?= $(if $(ENABLE_CUDNN),nvcc,mex) @@ -38,7 +38,7 @@ CUDAMETHOD ?= $(if $(ENABLE_CUDNN),nvcc,mex) # Maintenance NAME = matconvnet -VER = 1.0-beta22 +VER = 1.0-beta24 DIST = $(NAME)-$(VER) LATEST = $(NAME)-latest RSYNC = rsync @@ -82,7 +82,7 @@ LDFLAGS = LDOPTIMFLAGS = LINKLIBS = -lmwblas -NVCCFLAGS_PASS = -gencode=arch=compute_30,code=\"sm_30,compute_30\" +NVCCFLAGS_PASS = -D_FORCE_INLINES -gencode=arch=compute_30,code=\"sm_30,compute_30\" NVCCVER = $(shell $(NVCC) --version | \ sed -n 's/.*V\([0-9]*\).\([0-9]*\).\([0-9]*\).*/\1 \2 \3/p' | \ xargs printf '%02d%02d%02d') @@ -159,12 +159,14 @@ cpp_src+=matlab/src/bits/nnpooling.$(ext) cpp_src+=matlab/src/bits/nnnormalize.$(ext) cpp_src+=matlab/src/bits/nnbnorm.$(ext) cpp_src+=matlab/src/bits/nnbilinearsampler.$(ext) +cpp_src+=matlab/src/bits/nnroipooling.$(ext) mex_src+=matlab/src/vl_nnconv.$(ext) mex_src+=matlab/src/vl_nnconvt.$(ext) mex_src+=matlab/src/vl_nnpool.$(ext) mex_src+=matlab/src/vl_nnnormalize.$(ext) mex_src+=matlab/src/vl_nnbnorm.$(ext) mex_src+=matlab/src/vl_nnbilinearsampler.$(ext) +mex_src+=matlab/src/vl_nnroipool.$(ext) mex_src+=matlab/src/vl_taccummex.$(ext) mex_src+=matlab/src/vl_tmove.$(ext) ifdef ENABLE_IMREADJPEG @@ -180,6 +182,7 @@ cpp_src+=matlab/src/bits/impl/pooling_cpu.cpp cpp_src+=matlab/src/bits/impl/normalize_cpu.cpp cpp_src+=matlab/src/bits/impl/bnorm_cpu.cpp cpp_src+=matlab/src/bits/impl/bilinearsampler_cpu.cpp +cpp_src+=matlab/src/bits/impl/roipooling_cpu.cpp cpp_src+=matlab/src/bits/impl/tinythread.cpp ifdef ENABLE_IMREADJPEG cpp_src+=matlab/src/bits/impl/imread_$(IMAGELIB).cpp @@ -195,6 +198,7 @@ cpp_src+=matlab/src/bits/impl/pooling_gpu.cu cpp_src+=matlab/src/bits/impl/normalize_gpu.cu cpp_src+=matlab/src/bits/impl/bnorm_gpu.cu cpp_src+=matlab/src/bits/impl/bilinearsampler_gpu.cu +cpp_src+=matlab/src/bits/impl/roipooling_gpu.cu cpp_src+=matlab/src/bits/datacu.cu mex_src+=matlab/src/vl_cudatool.cu ifdef ENABLE_CUDNN @@ -255,7 +259,7 @@ CXXOPTIMFLAGS='$$CXXOPTIMFLAGS $(call nvcc-quote,$(CXXOPTIMFLAGS))' MEXFLAGS_LD := $(MEXFLAGS) \ LDFLAGS='$$LDFLAGS $(LDFLAGS)' \ LDOPTIMFLAGS='$$LDOPTIMFLAGS $(LDOPTIMFLAGS)' \ -LINKLIBS='$$LINKLIBS $(LINKLIBS)' \ +LINKLIBS='$(LINKLIBS) $$LINKLIBS' \ NVCCFLAGS = $(CXXFLAGS) $(NVCCFLAGS_PASS) \ -I"$(MATLABROOT)/extern/include" \ diff --git a/doc/Makefile b/doc/Makefile index 06a48506..0382579b 100644 --- a/doc/Makefile +++ b/doc/Makefile @@ -28,6 +28,7 @@ vl_nnnormalizelp.m \ vl_nnpdist.m \ vl_nnpool.m \ vl_nnrelu.m \ +vl_nnroipool.m \ vl_nnsigmoid.m \ vl_nnsoftmax.m \ vl_nnsoftmaxloss.m \ @@ -38,6 +39,7 @@ vl_imreadjpeg.m \ vl_imreadjpeg.m \ vl_taccum.m \ vl_tmove.m \ +vl_tshow.m \ simplenn/vl_simplenn.m \ simplenn/vl_simplenn_diagnose.m \ simplenn/vl_simplenn_tidy.m \ diff --git a/doc/blocks.tex b/doc/blocks.tex index 72ed12a5..ee27bdb2 100644 --- a/doc/blocks.tex +++ b/doc/blocks.tex @@ -214,6 +214,46 @@ \section{Spatial bilinear resampling}\label{s:spatial-sampler} See \cref{s:impl-sampler} for implementation details. +% ------------------------------------------------------------------ +\section{Region of interest pooling}\label{s:roi-pooling} +% ------------------------------------------------------------------ + +The \emph{region of interest (ROI) pooling} block applies max or average pooling to specified subwindows of a tensor. A region is a rectangle $R = (u_-,v_-,u_+,v_+)$.
The region itself is partitioned into $(H',W')$ tiles along the vertical and horizontal directions. The edges of the tiles have coordinates +\begin{align*} + v_{i'} &= v_- + \frac{v_+ - v_- + 1}{H'} (i' - 1), \quad i' = 1,\dots,H'+1,\\ + u_{j'} &= u_- + \frac{u_+ - u_- + 1}{W'} (j' - 1), \quad j' = 1,\dots,W'+1. +\end{align*} +Following the implementation of~\cite{girshick15fast}, the $H'\times W'$ pooling tiles are given by +\[ + \Omega_{i'j'} = + \{\lfloor v_{i'} \rfloor + 1, \dots, \lceil v_{i'+1} \rceil\} + \times + \{\lfloor u_{j'} \rfloor + 1, \dots, \lceil u_{j'+1} \rceil\}. +\] +Then the input and output tensors are as follows: +\[ + \bx \in \mathbb{R}^{H \times W \times C}, + \qquad + \by \in \mathbb{R}^{H' \times W' \times C}, +\] +where +\[ + y_{i'j'c} = \operatornamewithlimits{max}_{(i,j) \in \Omega_{i'j'}} x_{ijc}. +\] +Alternatively, $\max$ can be replaced by the averaging operator. + +The extent of each region is defined by four coordinates as specified above; however, differently from tensor indexes, these use $(0,0)$ as the coordinate of the top-left pixel. In fact, if there is a single tile ($H'=W'=1$), then the region $(0,0,W-1,H-1)$ covers the whole input image: +\[ + \Omega_{11} = + \{1, \dots, H\} + \times + \{1, \dots, W\}. +\] + +In more detail, the input to the block is a sequence of $K$ regions. Each region pools one of the $T$ images in the batch stored in $\bx \in \mathbb{R}^{H\times W\times C\times T}$. Regions are therefore specified as a tensor $R \in \mathbb{R}^{5 \times K}$, where the first coordinate is the index of the pooled image in the batch. The output is a $\by \in \mathbb{R}^{H' \times W' \times C \times K}$ tensor. + +Furthermore, for compatibility with~\cite{girshick15fast}, the region coordinates are rounded to the nearest integer before the definitions above are used. Note also that, due to the discretization details, 1) tiles always contain at least one pixel, 2) adjacent tiles can overlap by exactly one pixel, and 3) the discretization has a slight bias towards the top-left pixels. +
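A short worked instance makes the tiling concrete (the numbers here are chosen purely for illustration and are not part of the original section): take a region with $v_-=2$, $v_+=8$ and $H'=3$ vertical subdivisions, so that $v_{i'} = 2 + \frac{7}{3}(i'-1)$.

```latex
% Worked example of the tiling formulas above (illustrative numbers only).
\[
  v_1 = 2, \qquad
  v_2 = \tfrac{13}{3} \approx 4.33, \qquad
  v_3 = \tfrac{20}{3} \approx 6.67, \qquad
  v_4 = 9,
\]
\[
  \{\lfloor v_{i'} \rfloor + 1, \dots, \lceil v_{i'+1} \rceil\}
  \;=\;
  \{3,4,5\}, \qquad \{5,6,7\}, \qquad \{7,8,9\}.
\]
```

Every tile contains at least one pixel, and consecutive tiles share exactly one pixel (rows 5 and 7), illustrating the discretization remarks above.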
% ------------------------------------------------------------------ \section{Normalization}\label{s:normalization} % ------------------------------------------------------------------ diff --git a/doc/impl.tex b/doc/impl.tex index 65dc9217..93179e43 100644 --- a/doc/impl.tex +++ b/doc/impl.tex @@ -167,7 +167,7 @@ \section{Spatial pooling}\label{s:impl-pooling} \frac{d z}{d (\vv \by)^\top} S(\bx), $ -for all but a null set of points, where the operator is not differentiable (this usually does not pose problems in optimization by stochastic gradient). For max-pooling, similar relations exists with two differences: $S$ does not depend on the input $\bx$ and it is not binary, in order to account for the normalization factors. +for all but a null set of points, where the operator is not differentiable (this usually does not pose problems in optimization by stochastic gradient). For average pooling, similar relations exist with two differences: $S$ does not depend on the input $\bx$ and it is not binary, in order to account for the normalization factors. In summary, we have the expressions: \begin{equation}\label{e:max-mat} \boxed{ \vv\by = S(\bx) \vv \bx, @@ -429,12 +429,12 @@ \subsection{Spatial normalization}\label{s:impl-spnorm} The derivative of spatial normalization can be obtained as follows: \begin{align*} \frac{dz}{dx_{ijd}} -&= \sum_{i''j''d} +&= \sum_{i''j''} \frac{dz}{d y_{i''j''d}} \frac{d y_{i''j''d}}{d x_{ijd}} \\ &= -\sum_{i''j''d} +\sum_{i''j''} \frac{dz}{d y_{i''j''d}} (1 + \alpha n_{i''j''d}^2)^{-\beta} \frac{dx_{i''j''d}}{d x_{ijd}} @@ -450,7 +450,7 @@ \subsection{Spatial normalization}\label{s:impl-spnorm} (1 + \alpha n_{ijd}^2)^{-\beta} -2\alpha\beta x_{ijd} \left[ -\sum_{i''j''d} +\sum_{i''j''} \frac{dz}{d y_{i''j''d}} (1 + \alpha n_{i''j''d}^2)^{-\beta-1} x_{i''j''d} @@ -462,7 +462,7 @@ \subsection{Spatial normalization}\label{s:impl-spnorm} (1 + \alpha n_{ijd}^2)^{-\beta} -2\alpha\beta x_{ijd} \left[ -\sum_{i''j''d} +\sum_{i''j''} \eta_{i''j''d} \frac{dn_{i''j''d}^2}{d (x_{ijd}^2)} \right], diff --git a/doc/intro.tex b/doc/intro.tex index 1d017aa4..729d3e63 100644 --- a/doc/intro.tex +++ b/doc/intro.tex @@ -25,8 +25,8 @@ \section{Getting started}\label{s:getting-statrted} \begin{lstlisting}[escapechar=!] % install and compile MatConvNet (run once) untar(['http://www.vlfeat.org/matconvnet/download/' ... - 'matconvnet-1.0-beta12.tar.gz']) ; -cd matconvnet-1.0-beta12 + 'matconvnet-1.0-beta24.tar.gz']) ; +cd matconvnet-1.0-beta24 run matlab/vl_compilenn % download a pre-trained CNN from the web (run once) diff --git a/doc/matdocparser.py b/doc/matdocparser.py index 41ee51b7..8e49ed71 100644 --- a/doc/matdocparser.py +++ b/doc/matdocparser.py @@ -51,7 +51,7 @@ import re __mpname__ = 'MatDocParser' -__version__ = '1.0-beta15' +__version__ = '1.0-beta24' __date__ = '2015-09-20' __description__ = 'MatDoc MATLAB inline function description interpreter.' __long_description__ = __doc__ diff --git a/doc/site/docs/about.md b/doc/site/docs/about.md index 4a1caef9..26c05cdc 100644 --- a/doc/site/docs/about.md +++ b/doc/site/docs/about.md @@ -23,6 +23,28 @@ here. # Changes +- 1.0-beta24 (March 2017). + + **New features** + + * New toy example `cnn_toy_data.m` demonstrating the use of a + customized `imdb`. + * `vl_argparse.m` now supports dot paths and ignoring missing + defaults. + * Support for different example solvers (AdaGrad, Adam, AdaDelta, + RMSProp) and the ability to add new ones. + * A new function `vl_tshow.m` to glance at tensors. + * Bugfixes. + +- 1.0-beta23 (September 2016). + + **New features** + + * A new function `vl_nnroipool.m` for region of interest pooling, + supporting networks such as Fast-RCNN. + * Imported Fast-RCNN models from Caffe. + * An example Fast-RCNN implementation, training and testing. + - 1.0-beta22 (September 2016). * Bugfixes. diff --git a/doc/site/docs/css/fixes.css b/doc/site/docs/css/fixes.css index fb8e4c27..0a0090c2 100644 --- a/doc/site/docs/css/fixes.css +++ b/doc/site/docs/css/fixes.css @@ -66,7 +66,7 @@ a { color: #00438E ; } #Functions .dropdown-menu { color: #000; - max-height: 400px; + max-height: 800px; width: 342px; } diff --git a/doc/site/docs/functions.md b/doc/site/docs/functions.md index 261e09ce..83eb4198 100644 --- a/doc/site/docs/functions.md +++ b/doc/site/docs/functions.md @@ -33,6 +33,7 @@ showing how to train CNNs. - [`vl_nnpdist`](mfiles/vl_nnpdist.md) Pairwise distances. - [`vl_nnpool`](mfiles/vl_nnpool.md) Max and sum pooling. - [`vl_nnrelu`](mfiles/vl_nnrelu.md) Rectified Linear Unit. +- [`vl_nnroipool`](mfiles/vl_nnroipool.md) Region of interest pooling.
- [`vl_nnsigmoid`](mfiles/vl_nnsigmoid.md) Sigmoid. - [`vl_nnsoftmax`](mfiles/vl_nnsoftmax.md) Channel soft-max. - [`vl_nnsoftmaxloss`](mfiles/vl_nnsoftmaxloss.md) *Deprecated* @@ -70,3 +71,4 @@ showing how to train CNNs. - [`vl_imreadjpeg`](mfiles/vl_imreadjpeg.md) Quickly load a batch of JPEG images. - [`vl_taccum`](mfiles/vl_taccum.md) Accumulate tensors operating in-place when possible. - [`vl_tmove`](mfiles/vl_tmove.md) Exchange tensors between MATLAB processes and GPUs. +- [`vl_tshow`](mfiles/vl_tshow.md) Show a tensor on screen.
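The two functions just added to this list can be exercised together. The following is a hypothetical sketch rather than repository code: the ROI layout (image index first, followed by the $(u_-,v_-,u_+,v_+)$ coordinates) mirrors the new `blocks.tex` section, and the `'subdivisions'` option name should be verified against `help vl_nnroipool`.

```matlab
% Pool two regions of interest from a batch of two images (sketch).
x = randn(64, 64, 3, 2, 'single') ;       % HxWxCxT input tensor
rois = [1  0  0 31 31 ;                   % one region per row here,
        2  8  8 40 40]' ;                 % transposed to the 5xK layout
y = vl_nnroipool(x, rois, 'subdivisions', [6 6]) ;  % H'xW'xCxK output

vl_tshow(y) ;                             % glance at the pooled tensor
```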
diff --git a/doc/site/docs/index.md b/doc/site/docs/index.md index d86e5f5a..90b8ad68 100644 --- a/doc/site/docs/index.md +++ b/doc/site/docs/index.md @@ -2,7 +2,7 @@ @@ -31,6 +31,12 @@ efficient, and can run and learn state-of-the-art CNNs. Many pre-trained CNNs for image classification, segmentation, face recognition, and text detection are available. +> **New:** [1.0-beta24](about.md#changes) released with bugfixes, new +> examples, and utility functions. +> +> **New:** [1.0-beta23](about.md#changes) released with +> [`vl_nnroipool`](mfiles/vl_nnroipool) and a Fast-RCNN demo. +> > **New:** [1.0-beta22](about.md#changes) released with a few bugfixes. > > **New:** [1.0-beta21](about.md#changes) provides two new tools, @@ -52,7 +58,7 @@ recognition, and text detection are available. > numerous other improvements and bugfixes. ## Obtaining MatConvNet --  Tarball for [version 1.0-beta22](download/matconvnet-1.0-beta22.tar.gz); [older versions](download/) ( ) +-  Tarball for [version 1.0-beta24](download/matconvnet-1.0-beta24.tar.gz); [older versions](download/) ( ) -  [GIT repository](http://www.github.com/vlfeat/matconvnet.git) -  Citation diff --git a/doc/site/docs/install.md b/doc/site/docs/install.md index 96e379fc..c8b71682 100644 --- a/doc/site/docs/install.md +++ b/doc/site/docs/install.md @@ -21,7 +21,7 @@ To test GPU support (if you have [compiled it](#gpu)) use instead: > vl_testnn('gpu', true) Note that the second test runs slower than the CPU version; do not -worry, this is an artefact of the test procedure. +worry, this is an artifact of the test procedure. ## Compiling @@ -42,6 +42,30 @@ library: 1. Make sure that MATLAB is [configured to use your compiler](http://www.mathworks.com/help/matlab/matlab_external/changing-default-compiler.html). + In particular, before running `vl_compilenn` do not forget to set up + mex (once is sufficient) as follows: + + ``` + mex -setup + ``` + + The prerequisites are as follows: + + * For **macOS**, make sure you have Xcode installed. Note the special + requirements for GPU below. + + * For **Linux**, make sure GCC and LibJPEG are installed. To + install LibJPEG on Ubuntu/Debian-like distributions, use: + ``` + sudo apt-get install build-essential libjpeg-turbo8-dev + ``` + For Fedora/CentOS/RedHat-like distributions, use instead: + ``` + sudo yum install gcc gcc-c++ libjpeg-turbo-devel + ``` + + * For **Windows**, you need to install Visual Studio 2010 or later. + 2. Open MATLAB and issue the commands: > cd @@ -57,7 +81,7 @@ problem by running the compilation script again in verbose mode: Increase the verbosity level to 2 to get even more information. > **Remark:** The 'vl_imreadjpeg' tool uses an external image library -> to load images. In Mac OS X and Windows, the default is to use the +> to load images. In macOS and Windows, the default is to use the > system libraries (Quartz and GDI+ respectively), so this dependency > is immaterial. In Linux, this tool requires the LibJPEG > library and the corresponding development files to be installed in @@ -72,21 +96,42 @@ Increase the verbosity level to 2 to get even more information. To use the GPU-accelerated version of the library, you will need an NVIDIA GPU card with compute capability 2.0 or greater and a copy of -the NVIDIA CUDA toolkit. Ideally, the version of the CUDA toolkit -should match your MATLAB version: +the NVIDIA CUDA toolkit.
Officially, MATLAB supports the following +CUDA versions: | MATLAB | CUDA toolkit | |-----------|-------------------| -| R2013b | 5.5 | -| R2014a | 5.5 | -| R2014b | 6.0 | -| R2015a | 6.5 | +| R2017a | 8.0 | +| R2016b | 7.5 | +| R2016a | 7.5 | | R2015b | 7.0 | +| R2015a | 6.5 | +| R2014b | 6.0 | +| R2014a | 5.5 | +| R2013b | 5.5 | You can also use the `gpuDevice` MATLAB command to find out MATLAB's -version of the CUDA toolkit. It is also possible (and often necessary) -to use a more recent version of CUDA than the one officially supported -by MATLAB; this is [explained later](#nvcc). +version of the CUDA toolkit. Nevertheless, it is also possible and +often useful to use a more recent version of CUDA than the one +officially supported by MATLAB; this is [explained later](#nvcc). + +> **macOS**. CUDA is typically one or two steps behind the latest +> Xcode. For example, CUDA 8.0 requires Xcode 7.3.1 instead of more +> recent versions. You should: +> +> 1. Install Xcode 7.3.1 alongside other versions (e.g. in +> `/Applications/Xcode7.3.1.app`). +> +> 2. Use `xcode-select` in the terminal to change the active version +> of Xcode, as in `sudo xcode-select --switch +> /Applications/Xcode7.3.1.app/Contents/Developer/`. +> +> 3. Use `sudo xcode-select --install` to install the corresponding +> (downgraded) version of the command line tools. This is necessary, +> or CUDA compilation will fail with odd errors. +> +> It can be helpful to consult the +> [CUDA Installation Guide for Mac](http://docs.nvidia.com/cuda/pdf/CUDA_Installation_Guide_Mac.pdf). Assuming that there is only a single copy of the CUDA toolkit installed in your system and that it matches MATLAB's version, compile @@ -96,9 +141,9 @@ the library with: If you have multiple versions of the CUDA toolkit, or if the script cannot find the toolkit for any reason, specify the path to the CUDA -toolkit explicitly. For example, on a Mac this may look like: +toolkit explicitly. For example, on macOS this may look like: - > vl_compilenn('enableGpu', true, 'cudaRoot', '/Developer/NVIDIA/CUDA-7.0') + > vl_compilenn('enableGpu', true, 'cudaRoot', '/Developer/NVIDIA/CUDA-8.0') Once more, you can use the `verbose` option to obtain more information if needed. @@ -112,7 +157,7 @@ cause unforeseen issues (although none is known so far), it is necessary to use [recent libraries such as cuDNN](#cudnn). Compiling with a newer version of CUDA requires using the -`cudaMethod,nvcc` option. For example, on a Mac this may look like: +`cudaMethod,nvcc` option. For example, on macOS this may look like: > vl_compilenn('enableGpu', true, ... 'cudaRoot', '/Developer/NVIDIA/CUDA-7.0', ... 'cudaMethod', 'nvcc') @@ -130,7 +175,7 @@ is to start MATLAB from the command line (terminal) specifying the On Windows, chances are that the CUDA libraries are already visible to MATLAB so that nothing else needs to be done. -On Mac, this step should not be necessary as the library paths are +On macOS, this step should not be necessary as the library paths are hardcoded during compilation. @@ -153,7 +198,7 @@ Unpack the cuDNN library binaries and header files in a place assumed that this cuDNN RC4 has been unpacked in `local/cudnn-rc4` in the `` root directory (i.e. ``=`/local/cudnn-rc4`).
For example, the -directory structure on a Mac should look like: +directory structure on macOS should look like: COPYING Makefile @@ -172,7 +217,7 @@ directory structure on a Mac should look like: Use `vl_compilenn` with the `cudnnEnable,true` option to compile the library; do not forget to use `cudaMethod,nvcc` as, most likely, the CUDA toolkit version is newer than MATLAB's CUDA toolkit. For -example, on Mac this may look like: +example, on macOS this may look like: > vl_compilenn('enableGpu', true, ... 'cudaRoot', '/Developer/NVIDIA/CUDA-7.5', ... 'cudaMethod', 'nvcc', ... @@ -191,12 +236,12 @@ On Windows, copy the cuDNN DLL file `/cudnn*dll` (or from wherever you unpacked cuDNN) into the `/matlab/mex` directory. -On Mac, this step should not be necessary as the library paths are +On macOS, this step should not be necessary as the library paths are hardcoded during compilation. ## Further examples -To compile all the features in MatConvNet on a Mac and MATLAB 2014b, +To compile all the features in MatConvNet on macOS and MATLAB 2014b, CUDA toolkit 6.5 and cuDNN Release Candidate 2, use: > vl_compilenn('enableGpu', true, 'cudaMethod', 'nvcc', ... @@ -216,5 +261,3 @@ Using MATLAB 2015b, CUDA 7.5, and cuDNN R4: 'cudaRoot', '/opt/local/cuda-7.5', ... 'enableCudnn', true, ... 'cudnnRoot', 'local/cudnn-rc4') ; - - diff --git a/doc/site/docs/pretrained.md b/doc/site/docs/pretrained.md index f75a9ba2..b4d57f3d 100644 --- a/doc/site/docs/pretrained.md +++ b/doc/site/docs/pretrained.md @@ -23,6 +23,25 @@ from the example code included in the [quickstart guide](quick.md). > 3. These models are provided here for convenience, but please > credit the original authors. + +## Object detection + +These models are trained for object detection on PASCAL VOC. + +- **Fast R-CNN**. Models from the [Fast R-CNN](https://github.com/rbgirshick/fast-rcnn) page: + + - [fast-rcnn-caffenet-pascal07-dagnn](models/fast-rcnn-caffenet-pascal07-dagnn.mat) [](models/fast-rcnn-caffenet-pascal07-dagnn.svg) + - [fast-rcnn-vggm1k-pascal07-dagnn](models/fast-rcnn-vggm1k-pascal07-dagnn.mat) [](models/fast-rcnn-vggm1k-pascal07-dagnn.svg) + - [fast-rcnn-vgg16-pascal07-dagnn](models/fast-rcnn-vgg16-pascal07-dagnn.mat) [](models/fast-rcnn-vgg16-pascal07-dagnn.svg) + +The model performance is as follows (*mAP 11* indicates mean average precision computed using 11-point interpolation, as per the PASCAL VOC 07 specification): + +|model | training set | PASCAL07 test mAP | mAP 11 | +|-------------------------------------|--------------| ------------------|--------| +|fast-rcnn-caffenet-pascal07-dagnn | imnet12+pas07| 57.3 % | 58.1 % | +|fast-rcnn-vggm1k-pascal07-dagnn | imnet12+pas07| 59.4 % | 60.5 % | +|fast-rcnn-vgg16-pascal07-dagnn | imnet12+pas07| 67.3 % | 68.7 % | ## Face recognition These models are trained for face classification and verification. @@ -260,30 +279,33 @@ The following table summarizes the MD5 checksums for the model files.
| MD5 | File name | |----------------------------------|-----------------------------------------| -| ed49ef44caf18496291ce0c3257b0596 | imagenet-caffe-alex.mat | -| 6d69dfa6e549012c94546658737c5885 | imagenet-caffe-ref.mat | -| 04cd60e8ea6a0d47742206749f624ec8 | imagenet-googlenet-dag.mat | -| 55743accfaf47f5c34fa50fa047143fd | imagenet-matconvnet-alex.mat | -| b359b6ad071155eafa35c84a78f397c7 | imagenet-matconvnet-vgg-f.mat | -| 1bcad2e93b0cc6da3b7d1bf610582279 | imagenet-matconvnet-vgg-m.mat | -| 314c982669e202e0d419803c54d1fb8f | imagenet-matconvnet-vgg-s.mat | -| 14ece491f7311f6dc33bc3186729de5b | imagenet-matconvnet-vgg-verydeep-16.mat | -| be19a35a2b4f4c46ed61df684d08b900 | imagenet-resnet-101-dag.mat | -| 4461d3640d55aa2f58d990f7c92ff28c | imagenet-resnet-152-dag.mat | -| 73a3e51b75230d431c88bb795e14e91d | imagenet-resnet-50-dag.mat | -| f666c61dc968c413ef664a7e17b01144 | imagenet-vgg-f.mat | -| d15f53a30bba3abde4377eced695adab | imagenet-vgg-m-1024.mat | -| 779b86f55d0534d9fd322256372007a5 | imagenet-vgg-m-128.mat | -| 9d20b7ab01ca47617e808008da6b18cc | imagenet-vgg-m-2048.mat | -| 1c164950e882b4ea11623e669a86b1c4 | imagenet-vgg-m.mat | -| 93b683d5420c2eeaf07a6eef492f182b | imagenet-vgg-s.mat | -| 7f0f9f01dfd99c7b7088d1c5a26eb483 | imagenet-vgg-verydeep-16.mat | -| 49e623de543b207d57fab0f6eaf79a7e | imagenet-vgg-verydeep-19.mat | -| 48ccac8fb5c4961815705f1f84581ec3 | pascal-fcn16s-dag.mat | -| bf3ca0a59d1525f63e7c28d526ee0656 | pascal-fcn32s-dag.mat | -| 54b7ce1265a6cdd114d39d05515c73c4 | pascal-fcn8s-dag.mat | -| 2a42dd1d2987983dacffc436cca5dabf | pascal-fcn8s-tvg-dag.mat | -| 27e94d9979dad2385f901f0c360cf3bc | vgg-face.mat | +| 9dcc29b03edb5b136fda31fcd59bd025 | fast-rcnn-caffenet-pascal07-dagnn.mat | +| 961f997d7ff922f1ff6b7b20ad677a4c | fast-rcnn-vgg16-pascal07-dagnn.mat | +| f09a662aef88ac4c23d294eb1fb6f385 | fast-rcnn-vggm1k-pascal07-dagnn.mat | +| b5152a54bf61100a8ed61827c76e7d08 | imagenet-caffe-alex.mat | +| 675dd47906d34f4d9a70fc44210d3804 | imagenet-caffe-ref.mat | +| 97f4e1aa9ad6ed33fd325835710c5092 | imagenet-googlenet-dag.mat | +| 0998b7f66bd8dcbb78a3e75aaa6127f3 | imagenet-matconvnet-alex.mat | +| 790e116ec817a58960b103514891fdbf | imagenet-matconvnet-vgg-f.mat | +| 7e07705fc60c178ee3d2c09dab33acf3 | imagenet-matconvnet-vgg-m.mat | +| 82d5705d292714d0d6581a834485705b | imagenet-matconvnet-vgg-s.mat | +| 89a117515f66c3d7b0eb9d0516c65141 | imagenet-matconvnet-vgg-verydeep-16.mat | +| 16ff04c36c7bd33510e4a81db6dc764b | imagenet-resnet-101-dag.mat | +| f399bef82f5bcaf290d07ccc818833d7 | imagenet-resnet-152-dag.mat | +| d72aa76a8ddf8bd96e405ac0ba827724 | imagenet-resnet-50-dag.mat | +| 3513562d28089bd965cc050cbf8597a6 | imagenet-vgg-f.mat | +| 1410d01878346f911e991dd0c1bb983b | imagenet-vgg-m-1024.mat | +| 3a8dc312a44a99d21ad43e8d96a8590f | imagenet-vgg-m-128.mat | +| 087ec812e0a09980bd934e2e7ba157f6 | imagenet-vgg-m-2048.mat | +| 29294d5f62578c96a3533859514235f2 | imagenet-vgg-m.mat | +| dbe23da22e82078debda75842b16d5fa | imagenet-vgg-s.mat | +| f72d927587ca4c97fbd165ec9cb9997f | imagenet-vgg-verydeep-16.mat | +| 106118b7cf60435e6d8e04f6a6dc3657 | imagenet-vgg-verydeep-19.mat | +| 2e49dd427829cdbc08a0154f994687d7 | pascal-fcn16s-dag.mat | +| a1331885ec72a0721e51ac9d16262a48 | pascal-fcn32s-dag.mat | +| 0eeb6a4bc819616ea66f88a3db878983 | pascal-fcn8s-dag.mat | +| b0f7bd5833b555c6241dd0c05897ca41 | pascal-fcn8s-tvg-dag.mat | +| 3d6cd504bf9c98af4a561aad059565d1 | vgg-face.mat | ## Older file versions diff --git a/doc/site/docs/quick.md b/doc/site/docs/quick.md index 
4335dfed..dd55f7e3 100644 --- a/doc/site/docs/quick.md +++ b/doc/site/docs/quick.md @@ -11,8 +11,8 @@ speed, downloading the CNN model may require some time. ```matlab % Install and compile MatConvNet (needed once). -untar('http://www.vlfeat.org/matconvnet/download/matconvnet-1.0-beta22.tar.gz') ; -cd matconvnet-1.0-beta22 +untar('http://www.vlfeat.org/matconvnet/download/matconvnet-1.0-beta24.tar.gz') ; +cd matconvnet-1.0-beta24 run matlab/vl_compilenn ; % Download a pre-trained CNN from the web (needed once). diff --git a/doc/site/mkdocs.yml b/doc/site/mkdocs.yml index e24a5c3e..a268e24c 100644 --- a/doc/site/mkdocs.yml +++ b/doc/site/mkdocs.yml @@ -1,5 +1,5 @@ site_name: MatConvNet -markdown_extensions: ['extra', 'mathjax', 'toc'] +markdown_extensions: ['extra', 'math', 'toc'] theme_dir: theme extra_css: ['css/fixes.css'] @@ -37,6 +37,7 @@ pages: - vl_nnnormalize: 'mfiles/vl_nnnormalize.md' - vl_nnpool: 'mfiles/vl_nnpool.md' - vl_nnrelu: 'mfiles/vl_nnrelu.md' + - vl_nnroipool: 'mfiles/vl_nnroipool.md' - vl_nnsigmoid: 'mfiles/vl_nnsigmoid.md' - vl_nnsoftmax: 'mfiles/vl_nnsoftmax.md' - vl_nnsoftmaxloss: 'mfiles/vl_nnsoftmaxloss.md' @@ -53,6 +54,7 @@ pages: - vl_imreadjpeg: 'mfiles/vl_imreadjpeg.md' - vl_taccum: 'mfiles/vl_taccum.md' - vl_tmove: 'mfiles/vl_tmove.md' + - vl_tshow: 'mfiles/vl_tshow.md' - Contributing: - Developers notes: 'developers.md' diff --git a/examples/+solver/adadelta.m b/examples/+solver/adadelta.m new file mode 100644 index 00000000..c13d5d4a --- /dev/null +++ b/examples/+solver/adadelta.m @@ -0,0 +1,42 @@ +function [w, state] = adadelta(w, state, grad, opts, ~) +%ADADELTA +% Example AdaDelta solver, for use with CNN_TRAIN and CNN_TRAIN_DAG. +% +% AdaDelta sets its own learning rate, so any learning rate set in the +% options of CNN_TRAIN and CNN_TRAIN_DAG will be ignored. +% +% If called without any input argument, returns the default options +% structure. +% +% Solver options: (opts.train.solverOpts) +% +% `epsilon`:: 1e-6 +% Small additive constant to regularize variance estimate. +% +% `rho`:: 0.9 +% Moving average window for variance update, between 0 and 1 (larger +% values result in slower/more stable updating). + +% Copyright (C) 2016 Joao F. Henriques. +% All rights reserved. +% +% This file is part of the VLFeat library and is made available under +% the terms of the BSD license (see the COPYING file). + +if nargin == 0 % Return the default solver options + w = struct('epsilon', 1e-6, 'rho', 0.9) ; + return ; +end + +if isequal(state, 0) % First iteration, initialize state struct + state = struct('g_sqr', 0, 'delta_sqr', 0) ; +end + +rho = opts.rho ; + +state.g_sqr = state.g_sqr * rho + grad.^2 * (1 - rho) ; +new_delta = -sqrt((state.delta_sqr + opts.epsilon) ./ ... + (state.g_sqr + opts.epsilon)) .* grad ; +state.delta_sqr = state.delta_sqr * rho + new_delta.^2 * (1 - rho) ; + +w = w + new_delta ; diff --git a/examples/+solver/adagrad.m b/examples/+solver/adagrad.m new file mode 100644 index 00000000..69d66fd4 --- /dev/null +++ b/examples/+solver/adagrad.m @@ -0,0 +1,43 @@ +function [w, g_sqr] = adagrad(w, g_sqr, grad, opts, lr) +%ADAGRAD +% Example AdaGrad solver, for use with CNN_TRAIN and CNN_TRAIN_DAG. +% +% Set the initial learning rate for AdaGrad in the options for +% CNN_TRAIN and CNN_TRAIN_DAG. Note that a learning rate that works for +% SGD may be inappropriate for AdaGrad; the default is 0.001. +% +% If called without any input argument, returns the default options +% structure. 
+% +% Solver options: (opts.train.solverOpts) +% +% `epsilon`:: 1e-10 +% Small additive constant to regularize variance estimate. +% +% `rho`:: 1 +% Moving average window for variance update, between 0 and 1 (larger +% values result in slower/more stable updating). This is similar to +% RHO in AdaDelta and RMSProp. Standard AdaGrad is obtained with a RHO +% value of 1 (the total average is used instead of a moving average). +% +% A possibly undesirable effect of standard AdaGrad is that the update +% will monotonically decrease to 0, until training eventually stops. This +% is because the AdaGrad update is inversely proportional to the total +% variance of the gradients seen so far. +% With RHO smaller than 1, a moving average is used instead. This +% prevents the final update from monotonically decreasing to 0. + +% Copyright (C) 2016 Joao F. Henriques. +% All rights reserved. +% +% This file is part of the VLFeat library and is made available under +% the terms of the BSD license (see the COPYING file). + +if nargin == 0 % Return the default solver options + w = struct('epsilon', 1e-10, 'rho', 1) ; + return ; +end + +g_sqr = g_sqr * opts.rho + grad.^2 ; + +w = w - lr * grad ./ (sqrt(g_sqr) + opts.epsilon) ; diff --git a/examples/+solver/adam.m b/examples/+solver/adam.m new file mode 100644 index 00000000..f710c4c7 --- /dev/null +++ b/examples/+solver/adam.m @@ -0,0 +1,75 @@ +function [w, state] = adam(w, state, grad, opts, lr) +%ADAM +% Adam solver for use with CNN_TRAIN and CNN_TRAIN_DAG. +% +% See [Kingma et al., 2014](http://arxiv.org/abs/1412.6980) +% | ([pdf](http://arxiv.org/pdf/1412.6980.pdf)). +% +% If called without any input argument, returns the default options +% structure. Otherwise provide all input arguments. +% +% W is the vector/matrix/tensor of parameters. It can be single/double +% precision and can be a `gpuArray`. +% +% STATE is as defined below, and so are the supported OPTS. +% +% GRAD is the gradient of the objective w.r.t. W. +% +% LR is the learning rate, referred to as \alpha by Algorithm 1 in +% [Kingma et al., 2014]. +% +% Solver options: (opts.train.solverOpts) +% +% `beta1`:: 0.9 +% Decay for 1st moment vector. See algorithm 1 in [Kingma et al., 2014] +% +% `beta2`:: 0.999 +% Decay for 2nd moment vector +% +% `eps`:: 1e-8 +% Additive offset when dividing by state.v +% +% The state is initialized as 0 (number) to start with. The first call to +% this function will initialize it with the default state consisting of +% +% `m`:: 0 +% First moment vector +% +% `v`:: 0 +% Second moment vector +% +% `t`:: 0 +% Global iteration number across epochs +% +% This implementation is borrowed from Torch's optim.adam. + +% Copyright (C) 2016 Aravindh Mahendran. +% All rights reserved. +% +% This file is part of the VLFeat library and is made available under +% the terms of the BSD license (see the COPYING file).
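Because all of these example solvers share one calling convention, a brief usage sketch may help. It is hypothetical: it assumes an existing `net`, `imdb` and `getBatch` as in the other examples, and uses the `'solver'` option that this change adds to `cnn_train` and `cnn_train_dag`.

```matlab
% Train with Adam in place of the default SGD solver (sketch; any of
% the examples/+solver functions can be passed the same way).
[net, stats] = cnn_train(net, imdb, getBatch, ...
                         'solver', @solver.adam, ...
                         'learningRate', 0.001) ;
```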
+ +if nargin == 0 % Returns the default solver options + w = struct('beta1', 0.9, 'beta2', 0.999, 'eps', 1e-8) ; + return ; +end + +if isequal(state, 0) % start off with state = 0 so as to get default state + state = struct('m', 0, 'v', 0, 't', 0); +end + +% update first moment vector `m` +state.m = opts.beta1 * state.m + (1 - opts.beta1) * grad ; + +% update second moment vector `v` +state.v = opts.beta2 * state.v + (1 - opts.beta2) * grad.^2 ; + +% update the time step +state.t = state.t + 1 ; + +% This implicitly corrects for biased estimates of first and second moment +% vectors +lr_t = lr * (((1 - opts.beta2^state.t)^0.5) / (1 - opts.beta1^state.t)) ; + +% Update `w` +w = w - lr_t * state.m ./ (state.v.^0.5 + opts.eps) ; diff --git a/examples/+solver/rmsprop.m b/examples/+solver/rmsprop.m new file mode 100644 index 00000000..f1ae96e6 --- /dev/null +++ b/examples/+solver/rmsprop.m @@ -0,0 +1,34 @@ +function [w, g_sqr] = rmsprop(w, g_sqr, grad, opts, lr) +%RMSPROP +% Example RMSProp solver, for use with CNN_TRAIN and CNN_TRAIN_DAG. +% +% Set the initial learning rate for RMSProp in the options for +% CNN_TRAIN and CNN_TRAIN_DAG. Note that a learning rate that works for +% SGD may be inappropriate for RMSProp; the default is 0.001. +% +% If called without any input argument, returns the default options +% structure. +% +% Solver options: (opts.train.solverOpts) +% +% `epsilon`:: 1e-8 +% Small additive constant to regularize variance estimate. +% +% `rho`:: 0.99 +% Moving average window for variance update, between 0 and 1 (larger +% values result in slower/more stable updating). + +% Copyright (C) 2016 Joao F. Henriques. +% All rights reserved. +% +% This file is part of the VLFeat library and is made available under +% the terms of the BSD license (see the COPYING file). + +if nargin == 0 % Return the default solver options + w = struct('epsilon', 1e-8, 'rho', 0.99) ; + return ; +end + +g_sqr = g_sqr * opts.rho + grad.^2 * (1 - opts.rho) ; + +w = w - lr * grad ./ (sqrt(g_sqr) + opts.epsilon) ; diff --git a/examples/cnn_train.m b/examples/cnn_train.m index cab63a48..99edd5db 100644 --- a/examples/cnn_train.m +++ b/examples/cnn_train.m @@ -16,6 +16,7 @@ % % This file is part of the VLFeat library and is made available under % the terms of the BSD license (see the COPYING file). +addpath(fullfile(vl_rootnn, 'examples')); opts.expDir = fullfile('data','exp') ; opts.continue = true ; @@ -24,12 +25,23 @@ opts.train = [] ; opts.val = [] ; opts.gpus = [] ; +opts.epochSize = inf; opts.prefetch = false ; opts.numEpochs = 300 ; opts.learningRate = 0.001 ; opts.weightDecay = 0.0005 ; + +opts.solver = [] ; % Empty array means use the default SGD solver +[opts, varargin] = vl_argparse(opts, varargin) ; +if ~isempty(opts.solver) + assert(isa(opts.solver, 'function_handle') && nargout(opts.solver) == 2,... 
+ 'Invalid solver; expected a function handle with two outputs.') ; + % Call without input arguments, to get default options + opts.solverOpts = opts.solver() ; +end + opts.momentum = 0.9 ; -opts.saveMomentum = true ; +opts.saveSolverState = true ; opts.nesterovUpdate = false ; opts.randomSeed = 0 ; opts.memoryMapFile = fullfile(tempdir, 'matconvnet.bin') ; @@ -45,13 +57,18 @@ opts.errorLabels = {} ; opts.plotDiagnostics = false ; opts.plotStatistics = true; +opts.postEpochFn = [] ; % postEpochFn(net,params,state) called after each epoch; can return a new learning rate, 0 to stop, [] for no change opts = vl_argparse(opts, varargin) ; if ~exist(opts.expDir, 'dir'), mkdir(opts.expDir) ; end if isempty(opts.train), opts.train = find(imdb.images.set==1) ; end if isempty(opts.val), opts.val = find(imdb.images.set==2) ; end -if isnan(opts.train), opts.train = [] ; end -if isnan(opts.val), opts.val = [] ; end +if isscalar(opts.train) && isnumeric(opts.train) && isnan(opts.train) + opts.train = [] ; +end +if isscalar(opts.val) && isnumeric(opts.val) && isnan(opts.val) + opts.val = [] ; +end % ------------------------------------------------------------------------- % Initialization @@ -124,6 +141,7 @@ params.epoch = epoch ; params.learningRate = opts.learningRate(min(epoch, numel(opts.learningRate))) ; params.train = opts.train(randperm(numel(opts.train))) ; % shuffle + params.train = params.train(1:min(opts.epochSize, numel(opts.train))); params.val = opts.val(randperm(numel(opts.val))) ; params.imdb = imdb ; params.getBatch = getBatch ; @@ -150,7 +168,9 @@ stats.train(epoch) = lastStats.train ; stats.val(epoch) = lastStats.val ; clear lastStats ; - saveStats(modelPath(epoch), stats) ; + if ~evaluateMode + saveStats(modelPath(epoch), stats) ; + end if params.plotStatistics switchFigure(1) ; clf ; @@ -180,6 +200,16 @@ drawnow ; print(1, modelFigPath, '-dpdf') ; end + + if ~isempty(opts.postEpochFn) + if nargout(opts.postEpochFn) == 0 + opts.postEpochFn(net, params, state) ; + else + lr = opts.postEpochFn(net, params, state) ; + if ~isempty(lr), opts.learningRate = lr; end + if opts.learningRate == 0, break; end + end + end end % With multiple GPUs, return one copy @@ -230,11 +260,10 @@ % spmd caller. % initialize with momentum 0 -if isempty(state) || isempty(state.momentum) +if isempty(state) || isempty(state.solverState) for i = 1:numel(net.layers) - for j = 1:numel(net.layers{i}.weights) - state.momentum{i}{j} = 0 ; - end + state.solverState{i} = cell(1, numel(net.layers{i}.weights)) ; + state.solverState{i}(:) = {0} ; end end @@ -242,9 +271,14 @@ numGpus = numel(params.gpus) ; if numGpus >= 1 net = vl_simplenn_move(net, 'gpu') ; - for i = 1:numel(state.momentum) - for j = 1:numel(state.momentum{i}) - state.momentum{i}{j} = gpuArray(state.momentum{i}{j}) ; + for i = 1:numel(state.solverState) + for j = 1:numel(state.solverState{i}) + s = state.solverState{i}{j} ; + if isnumeric(s) + state.solverState{i}{j} = gpuArray(s) ; + elseif isstruct(s) + state.solverState{i}{j} = structfun(@gpuArray, s, 'UniformOutput', false) ; + end end end end @@ -370,7 +404,7 @@ 'XScale', 'log', ... 'XLim', [1e-5 1], ... 'XTick', 10.^(-5:1)) ; - grid on ; + grid on ; title('Variation'); subplot(2,2,2) ; barh(sqrt(diagnpow)) ; set(gca,'TickLabelInterpreter', 'none', ... 'YTick', 1:numel(diagnpow), ... @@ -379,7 +413,7 @@ 'XScale', 'log', ... 'XLim', [1e-5 1e5], ... 
'XTick', 10.^(-5:5)) ; - grid on ; + grid on ; title('Power'); subplot(2,2,3); plot(squeeze(res(end-1).x)) ; drawnow ; end @@ -396,12 +430,17 @@ mpiprofile off ; end end -if ~params.saveMomentum - state.momentum = [] ; +if ~params.saveSolverState + state.solverState = [] ; else - for i = 1:numel(state.momentum) - for j = 1:numel(state.momentum{i}) - state.momentum{i}{j} = gather(state.momentum{i}{j}) ; + for i = 1:numel(state.solverState) + for j = 1:numel(state.solverState{i}) + s = state.solverState{i}{j} ; + if isnumeric(s) + state.solverState{i}{j} = gather(s) ; + elseif isstruct(s) + state.solverState{i}{j} = structfun(@gather, s, 'UniformOutput', false) ; + end end end end @@ -437,28 +476,37 @@ thisDecay = params.weightDecay * net.layers{l}.weightDecay(j) ; thisLR = params.learningRate * net.layers{l}.learningRate(j) ; - % Normalize gradient and incorporate weight decay. - parDer = vl_taccum(1/batchSize, parDer, ... - thisDecay, net.layers{l}.weights{j}) ; + if thisLR>0 || thisDecay>0 + % Normalize gradient and incorporate weight decay. + parDer = vl_taccum(1/batchSize, parDer, ... + thisDecay, net.layers{l}.weights{j}) ; + + if isempty(params.solver) + % Default solver is the optimised SGD. + % Update momentum. + state.solverState{l}{j} = vl_taccum(... + params.momentum, state.solverState{l}{j}, ... + -1, parDer) ; + + % Nesterov update (aka one step ahead). + if params.nesterovUpdate + delta = params.momentum * state.solverState{l}{j} - parDer ; + else + delta = state.solverState{l}{j} ; + end - % Update momentum. - state.momentum{l}{j} = vl_taccum(... - params.momentum, state.momentum{l}{j}, ... - -1, parDer) ; + % Update parameters. + net.layers{l}.weights{j} = vl_taccum(... + 1, net.layers{l}.weights{j}, ... + thisLR, delta) ; - % Nesterov update (aka one step ahead). - if params.nesterovUpdate - delta = vl_taccum(... - params.momentum, state.momentum{l}{j}, ... - -1, parDer) ; - else - delta = state.momentum{l}{j} ; + else + % call solver function to update weights + [net.layers{l}.weights{j}, state.solverState{l}{j}] = ... + params.solver(net.layers{l}.weights{j}, state.solverState{l}{j}, ... + parDer, params.solverOpts, thisLR) ; + end end - - % Update parameters. - net.layers{l}.weights{j} = vl_taccum(... - 1, net.layers{l}.weights{j}, ... - thisLR, delta) ; end % if requested, collect some useful stats for debugging @@ -467,7 +515,9 @@ label = '' ; switch net.layers{l}.type case {'conv','convt'} - variation = thisLR * mean(abs(state.momentum{l}{j}(:))) ; + if isnumeric(state.solverState{l}{j}) + variation = thisLR * mean(abs(state.solverState{l}{j}(:))) ; + end power = mean(res(l+1).x(:).^2) ; if j == 1 % filters base = mean(net.layers{l}.weights{j}(:).^2) ; diff --git a/examples/cnn_train_dag.m b/examples/cnn_train_dag.m index 25cbff46..b1898cc3 100644 --- a/examples/cnn_train_dag.m +++ b/examples/cnn_train_dag.m @@ -8,6 +8,7 @@ % % This file is part of the VLFeat library and is made available under % the terms of the BSD license (see the COPYING file). +addpath(fullfile(vl_rootnn, 'examples')); opts.expDir = fullfile('data','exp') ; opts.continue = true ; @@ -17,11 +18,22 @@ opts.val = [] ; opts.gpus = [] ; opts.prefetch = false ; +opts.epochSize = inf; opts.numEpochs = 300 ; opts.learningRate = 0.001 ; opts.weightDecay = 0.0005 ; + +opts.solver = [] ; % Empty array means use the default SGD solver +[opts, varargin] = vl_argparse(opts, varargin) ; +if ~isempty(opts.solver) + assert(isa(opts.solver, 'function_handle') && nargout(opts.solver) == 2,...
+ 'Invalid solver; expected a function handle with two outputs.') ; + % Call without input arguments, to get default options + opts.solverOpts = opts.solver() ; +end + opts.momentum = 0.9 ; -opts.saveMomentum = true ; +opts.saveSolverState = true ; opts.nesterovUpdate = false ; opts.randomSeed = 0 ; opts.profile = false ; @@ -31,13 +43,18 @@ opts.derOutputs = {'objective', 1} ; opts.extractStatsFn = @extractStats ; opts.plotStatistics = true; +opts.postEpochFn = [] ; % postEpochFn(net,params,state) called after each epoch; can return a new learning rate, 0 to stop, [] for no change opts = vl_argparse(opts, varargin) ; if ~exist(opts.expDir, 'dir'), mkdir(opts.expDir) ; end if isempty(opts.train), opts.train = find(imdb.images.set==1) ; end if isempty(opts.val), opts.val = find(imdb.images.set==2) ; end -if isnan(opts.train), opts.train = [] ; end -if isnan(opts.val), opts.val = [] ; end +if isscalar(opts.train) && isnumeric(opts.train) && isnan(opts.train) + opts.train = [] ; +end +if isscalar(opts.val) && isnumeric(opts.val) && isnan(opts.val) + opts.val = [] ; +end % ------------------------------------------------------------------------- % Initialization @@ -79,6 +96,7 @@ params.epoch = epoch ; params.learningRate = opts.learningRate(min(epoch, numel(opts.learningRate))) ; params.train = opts.train(randperm(numel(opts.train))) ; % shuffle + params.train = params.train(1:min(opts.epochSize, numel(opts.train))); params.val = opts.val(randperm(numel(opts.val))) ; params.imdb = imdb ; params.getBatch = getBatch ; @@ -135,6 +153,16 @@ drawnow ; print(1, modelFigPath, '-dpdf') ; end + + if ~isempty(opts.postEpochFn) + if nargout(opts.postEpochFn) == 0 + opts.postEpochFn(net, params, state) ; + else + lr = opts.postEpochFn(net, params, state) ; + if ~isempty(lr), opts.learningRate = lr; end + if opts.learningRate == 0, break; end + end + end end % With multiple GPUs, return one copy @@ -148,15 +176,23 @@ % spmd caller. % initialize with momentum 0 -if isempty(state) || isempty(state.momentum) - state.momentum = num2cell(zeros(1, numel(net.params))) ; +if isempty(state) || isempty(state.solverState) + state.solverState = cell(1, numel(net.params)) ; + state.solverState(:) = {0} ; end % move CNN to GPU as needed numGpus = numel(params.gpus) ; if numGpus >= 1 net.move('gpu') ; - state.momentum = cellfun(@gpuArray, state.momentum, 'uniformoutput', false) ; + for i = 1:numel(state.solverState) + s = state.solverState{i} ; + if isnumeric(s) + state.solverState{i} = gpuArray(s) ; + elseif isstruct(s) + state.solverState{i} = structfun(@gpuArray, s, 'UniformOutput', false) ; + end + end end if numGpus > 1 parserv = ParameterServer(params.parameterServer) ; @@ -260,10 +296,17 @@ mpiprofile off ; end end -if ~params.saveMomentum - state.momentum = [] ; +if ~params.saveSolverState + state.solverState = [] ; else - state.momentum = cellfun(@gather, state.momentum, 'uniformoutput', false) ; + for i = 1:numel(state.solverState) + s = state.solverState{i} ; + if isnumeric(s) + state.solverState{i} = gather(s) ; + elseif isstruct(s) + state.solverState{i} = structfun(@gather, s, 'UniformOutput', false) ; + end + end end net.reset() ; @@ -295,28 +338,36 @@ thisDecay = params.weightDecay * net.params(p).weightDecay ; thisLR = params.learningRate * net.params(p).learningRate ; - % Normalize gradient and incorporate weight decay. - parDer = vl_taccum(1/batchSize, parDer, ... - thisDecay, net.params(p).value) ; - - % Update momentum. - state.momentum{p} = vl_taccum(... - params.momentum, state.momentum{p}, ... 
- -1, parDer) ; - - % Nesterov update (aka one step ahead). - if params.nesterovUpdate - delta = vl_taccum(... - params.momentum, state.momentum{p}, ... - -1, parDer) ; - else - delta = state.momentum{p} ; + if thisLR>0 || thisDecay>0 + % Normalize gradient and incorporate weight decay. + parDer = vl_taccum(1/batchSize, parDer, ... + thisDecay, net.params(p).value) ; + + if isempty(params.solver) + % Default solver is the optimised SGD. + % Update momentum. + state.solverState{p} = vl_taccum(... + params.momentum, state.solverState{p}, ... + -1, parDer) ; + + % Nesterov update (aka one step ahead). + if params.nesterovUpdate + delta = params.momentum * state.solverState{p} - parDer ; + else + delta = state.solverState{p} ; + end + + % Update parameters. + net.params(p).value = vl_taccum(... + 1, net.params(p).value, thisLR, delta) ; + + else + % call solver function to update weights + [net.params(p).value, state.solverState{p}] = ... + params.solver(net.params(p).value, state.solverState{p}, ... + parDer, params.solverOpts, thisLR) ; + end end - - % Update parameters. - net.params(p).value = vl_taccum(... - 1, net.params(p).value, thisLR, delta) ; - otherwise error('Unknown training method ''%s'' for parameter ''%s''.', ... net.params(p).trainMethod, ... @@ -362,6 +413,7 @@ % ------------------------------------------------------------------------- sel = find(cellfun(@(x) isa(x,'dagnn.Loss'), {net.layers.block})) ; for i = 1:numel(sel) + if net.layers(sel(i)).block.ignoreAverage, continue; end; stats.(net.layers(sel(i)).outputs{1}) = net.layers(sel(i)).block.average ; end diff --git a/examples/custom_imdb/cnn_toy_data.m b/examples/custom_imdb/cnn_toy_data.m new file mode 100644 index 00000000..59c2b212 --- /dev/null +++ b/examples/custom_imdb/cnn_toy_data.m @@ -0,0 +1,155 @@ +function [net, stats] = cnn_toy_data(varargin) +% CNN_TOY_DATA +% Minimal demonstration of MatConvNet training of a CNN on toy data. +% +% It also serves as a short tutorial on creating and using a custom imdb +% (image database). +% +% The task is to distinguish between images of triangles, squares and +% circles. + +% Copyright (C) 2017 Joao F. Henriques. +% All rights reserved. +% +% This file is part of the VLFeat library and is made available under +% the terms of the BSD license (see the COPYING file). + +run([fileparts(mfilename('fullpath')) '/../../matlab/vl_setupnn.m']) ; + +% Parameter defaults. You can add any custom parameters here (e.g. +% opts.alpha = 1), and change them when calling: cnn_toy_data('alpha', 2). +opts.train.batchSize = 200 ; +opts.train.numEpochs = 10 ; +opts.train.continue = true ; +opts.train.gpus = [] ; +opts.train.learningRate = 0.01 ; +opts.train.expDir = [vl_rootnn '/data/toy'] ; +opts.dataDir = [vl_rootnn '/data/toy-dataset'] ; +[opts, varargin] = vl_argparse(opts, varargin) ; + +opts.imdbPath = [opts.train.expDir '/imdb.mat'] ; +opts = vl_argparse(opts, varargin) ; + +% -------------------------------------------------------------------- +% Prepare data +% -------------------------------------------------------------------- + +% Generate images if they don't exist (this would be skipped for real data) +if ~exist(opts.dataDir, 'dir') + mkdir(opts.dataDir) ; + cnn_toy_data_generator(opts.dataDir) ; +end + +% Create image database (imdb struct).
It can be cached to a file for speed +if exist(opts.imdbPath, 'file') + disp('Reloading image database...') + imdb = load(opts.imdbPath) ; +else + disp('Creating image database...') + imdb = getImdb(opts.dataDir) ; + mkdir(fileparts(opts.imdbPath)) ; + save(opts.imdbPath, '-struct', 'imdb') ; +end + +% Create network (see HELP VL_SIMPLENN) +f = 1/100 ; +net.layers = {} ; +net.layers{end+1} = struct('type', 'conv', ... + 'weights', {{f*randn(5,5,1,5, 'single'), zeros(1, 5, 'single')}}) ; +net.layers{end+1} = struct('type', 'pool', ... + 'method', 'max', ... + 'pool', [2 2], ... + 'stride', 2) ; +net.layers{end+1} = struct('type', 'conv', ... + 'weights', {{f*randn(5,5,5,10, 'single'),zeros(1,10,'single')}}) ; +net.layers{end+1} = struct('type', 'pool', ... + 'method', 'max', ... + 'pool', [2 2], ... + 'stride', 2) ; +net.layers{end+1} = struct('type', 'conv', ... + 'weights', {{f*randn(5,5,10,3, 'single'), zeros(1,3,'single')}}) ; +net.layers{end+1} = struct('type', 'softmaxloss') ; + +% Fill in any values we didn't specify explicitly +net = vl_simplenn_tidy(net) ; + + +% -------------------------------------------------------------------- +% Train +% -------------------------------------------------------------------- + +use_gpu = ~isempty(opts.train.gpus) ; + +% Start training +[net, stats] = cnn_train(net, imdb, @(imdb, batch) getBatch(imdb, batch, use_gpu), ... + 'train', find(imdb.set == 1), 'val', find(imdb.set == 2), opts.train) ; + +% Visualize the learned filters +figure(3) ; vl_tshow(net.layers{1}.weights{1}) ; title('Conv1 filters') ; +figure(4) ; vl_tshow(net.layers{3}.weights{1}) ; title('Conv2 filters') ; +figure(5) ; vl_tshow(net.layers{5}.weights{1}) ; title('Conv3 filters') ; + + +% -------------------------------------------------------------------- +function [images, labels] = getBatch(imdb, batch, use_gpu) +% -------------------------------------------------------------------- +% This is where we return a given set of images (and their labels) from +% our imdb structure. +% If the dataset were too large to fit in memory, getBatch could load images +% from disk instead (with indexes given in 'batch'). + +images = imdb.images(:,:,:,batch) ; +labels = imdb.labels(batch) ; + +if use_gpu + images = gpuArray(images) ; +end + +% -------------------------------------------------------------------- +function imdb = getImdb(dataDir) +% -------------------------------------------------------------------- +% Initialize the imdb structure (image database). +% Note the fields are arbitrary: only your getBatch needs to understand it. +% The field imdb.set distinguishes between the training and validation +% sets, and is only used in the above call to cnn_train.
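For reference, this is the shape of the struct that the function below builds; it summarizes the code that follows, and the field names are this example's convention rather than a fixed MatConvNet interface.

```matlab
% Sketch of the imdb produced by getImdb below:
%   imdb.images   32x32x1xN single array, later mean-subtracted
%   imdb.labels   Nx1 class labels in 1..3
%   imdb.set      Nx1 flags: 1 = training sample, 2 = validation sample
```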
+ +% The sets, and number of samples per label in each set +sets = {'train', 'val'} ; +numSamples = [1500, 150] ; + +% Preallocate memory +totalSamples = 4950 ; % 3 * 1500 + 3 * 150 +images = zeros(32, 32, 1, totalSamples, 'single') ; +labels = zeros(totalSamples, 1) ; +set = ones(totalSamples, 1) ; + +% Read all samples +sample = 1 ; +for s = 1:2 % Iterate sets + for label = 1:3 % Iterate labels + for i = 1:numSamples(s) % Iterate samples + % Read image + im = imread(sprintf('%s/%s/%i/%04i.png', dataDir, sets{s}, label, i)) ; + + % Store it, along with label and train/val set information + images(:,:,:,sample) = single(im) ; + labels(sample) = label ; + set(sample) = s ; + sample = sample + 1 ; + end + end +end + +% Show some random example images +figure(2) ; +montage(images(:,:,:,randperm(totalSamples, 100))) ; +title('Example images') ; + +% Remove mean over whole dataset +images = bsxfun(@minus, images, mean(images, 4)) ; + +% Store results in the imdb struct +imdb.images = images ; +imdb.labels = labels ; +imdb.set = set ; + diff --git a/examples/custom_imdb/cnn_toy_data_generator.m b/examples/custom_imdb/cnn_toy_data_generator.m new file mode 100644 index 00000000..cbe9d2d1 --- /dev/null +++ b/examples/custom_imdb/cnn_toy_data_generator.m @@ -0,0 +1,51 @@ +function cnn_toy_data_generator(dataDir) +%CNN_TOY_DATA_GENERATOR +% Generates toy data in the given path: random images of triangles, +% squares and circles. +% +% The directory format is: '//