|
| 1 | +#include "tensorflow/core/framework/op.h" |
| 2 | +#include "tensorflow/core/framework/op_kernel.h" |
| 3 | +#include <cstdio> |
| 4 | +#include <iostream> |
| 5 | +#include <typeinfo> |
| 6 | + |
| 7 | +using namespace tensorflow; |
| 8 | +using namespace std; |
| 9 | + |
| 10 | +REGISTER_OP("RoiPooling") |
| 11 | +.Input("input: float32") |
| 12 | +.Input("rois: int32") |
| 13 | +.Attr("pool_height: int") |
| 14 | +.Attr("pool_width: int") |
| 15 | +.Output("output: float32") |
| 16 | +.Output("argmax_output: int32"); |
| 17 | + |
| 18 | + |
| 19 | +#define Dtype float |
| 20 | + |
| 21 | +void RoiPoolingKernelLauncher(const float* input, const int* rois, int n_rois, int channels, int height, int width, |
| 22 | + int pooled_height, int pooled_width, Dtype* output, int* argmax_output); |
| 23 | + |
| 24 | +// IMPORTANT(maciek): need info about storage of the data in memory, assumed something but need the docs confirming it |
| 25 | + |
| 26 | +class RoiPoolingOp : public OpKernel { |
| 27 | + private: |
| 28 | + int pool_height_, pool_width_; |
| 29 | + public: |
| 30 | + explicit RoiPoolingOp(OpKernelConstruction* context) : OpKernel(context) { |
| 31 | + OP_REQUIRES_OK(context, |
| 32 | + context->GetAttr("pool_height", &pool_height_)); |
| 33 | + |
| 34 | + OP_REQUIRES_OK(context, |
| 35 | + context->GetAttr("pool_width", &pool_width_)); |
| 36 | + } |
| 37 | + |
| 38 | + |
| 39 | + void Compute(OpKernelContext* context) override { |
| 40 | + // Grab the input tensor |
| 41 | + const Tensor& input_tensor = context->input(0); |
| 42 | + const Tensor& rois_tensor = context->input(1); |
| 43 | + |
| 44 | + auto input = input_tensor.flat<float>(); |
| 45 | + auto rois = rois_tensor.flat<int32>(); |
| 46 | + |
| 47 | + // Create an output tensor |
| 48 | + Tensor* output_tensor = NULL; |
| 49 | + Tensor* argmax_output_tensor = NULL; |
| 50 | + |
| 51 | + auto input_shape = input_tensor.shape(); |
| 52 | + auto rois_shape = rois_tensor.shape(); |
| 53 | + |
| 54 | + int n_rois = rois_shape.dim_size(0); |
| 55 | + int height = input_shape.dim_size(1); |
| 56 | + int width = input_shape.dim_size(2); |
| 57 | + int channels = input_shape.dim_size(3); |
| 58 | + |
| 59 | + TensorShape output_shape = TensorShape({static_cast<int64>(n_rois), |
| 60 | + static_cast<int64>(channels), |
| 61 | + static_cast<int64>(pool_height_), |
| 62 | + static_cast<int64>(pool_width_)}); |
| 63 | + |
| 64 | + OP_REQUIRES_OK(context, context->allocate_output(0, output_shape, |
| 65 | + &output_tensor)); |
| 66 | + |
| 67 | + OP_REQUIRES_OK(context, context->allocate_output(1, output_shape, |
| 68 | + &argmax_output_tensor)); |
| 69 | + |
| 70 | + auto output = output_tensor->template flat<float>(); |
| 71 | + auto argmax_output = argmax_output_tensor->template flat<int32>(); |
| 72 | + |
| 73 | + RoiPoolingKernelLauncher(input.data(), rois.data(), |
| 74 | + n_rois, channels, |
| 75 | + height, width, |
| 76 | + pool_height_, pool_width_, |
| 77 | + output.data(), argmax_output.data()); |
| 78 | + } |
| 79 | +}; |
| 80 | + |
| 81 | +REGISTER_KERNEL_BUILDER(Name("RoiPooling").Device(DEVICE_GPU), RoiPoolingOp); |
| 82 | + |
| 83 | +///////////// RoiPoolingGrad |
| 84 | + |
| 85 | + |
| 86 | +REGISTER_OP("RoiPoolingGrad") |
| 87 | +.Input("orig_input: float32") |
| 88 | +.Input("orig_rois: int32") |
| 89 | +.Input("orig_output: float32") |
| 90 | +.Input("orig_argmax_output: int32") |
| 91 | +.Input("orig_output_grad: float32") |
| 92 | +.Attr("pool_height: int") |
| 93 | +.Attr("pool_width: int") |
| 94 | +.Output("output: float32") |
| 95 | +.Doc(R"doc( |
| 96 | + region of interest pooling grad |
| 97 | +)doc"); |
| 98 | + |
| 99 | +#define Dtype float |
| 100 | +void RoiPoolingGradKernelLauncher(const Dtype* orig_input, const int* orig_rois, |
| 101 | + int mb_size, |
| 102 | + int n_rois, int channels, int height, int width, |
| 103 | + int pooled_height, int pooled_width, |
| 104 | + const Dtype* orig_output, const int* orig_argmax_output, |
| 105 | + const Dtype* orig_output_grad, |
| 106 | + Dtype* output); |
| 107 | + |
| 108 | +// IMPORTANT(maciek): need info about storage of the data in memory, assumed something but need the docs confirming it |
| 109 | + |
| 110 | +class RoiPoolingGradOp : public OpKernel { |
| 111 | + private: |
| 112 | + int pool_height_, pool_width_; |
| 113 | + public: |
| 114 | + explicit RoiPoolingGradOp(OpKernelConstruction* context) : OpKernel(context) { |
| 115 | + OP_REQUIRES_OK(context, |
| 116 | + context->GetAttr("pool_height", &pool_height_)); |
| 117 | + |
| 118 | + OP_REQUIRES_OK(context, |
| 119 | + context->GetAttr("pool_width", &pool_width_)); |
| 120 | + } |
| 121 | + |
| 122 | + |
| 123 | + void Compute(OpKernelContext* context) override { |
| 124 | + // Grab the input tensor |
| 125 | + const Tensor& orig_input_tensor = context->input(0); |
| 126 | + const Tensor& orig_rois_tensor = context->input(1); |
| 127 | + const Tensor& orig_output_tensor = context->input(2); |
| 128 | + const Tensor& orig_argmax_output_tensor = context->input(3); |
| 129 | + const Tensor& orig_output_grad_tensor = context->input(4); |
| 130 | + |
| 131 | + auto orig_input = orig_input_tensor.flat<float>(); |
| 132 | + auto orig_rois = orig_rois_tensor.flat<int32>(); |
| 133 | + auto orig_output = orig_output_tensor.flat<float>(); |
| 134 | + auto orig_argmax_output = orig_argmax_output_tensor.flat<int32>(); |
| 135 | + auto orig_output_grad = orig_output_grad_tensor.flat<float>(); |
| 136 | + |
| 137 | + // Create an output tensor |
| 138 | + Tensor* output_tensor = NULL; |
| 139 | + auto orig_input_shape = orig_input_tensor.shape(); |
| 140 | + auto orig_rois_shape = orig_rois_tensor.shape(); |
| 141 | + auto grads_shape = orig_input_shape; |
| 142 | + |
| 143 | + int mb_size = orig_input_shape.dim_size(0); |
| 144 | + int n_rois = orig_rois_shape.dim_size(0); |
| 145 | + int height = orig_input_shape.dim_size(1); |
| 146 | + int width = orig_input_shape.dim_size(2); |
| 147 | + int channels = orig_input_shape.dim_size(3); |
| 148 | + |
| 149 | + OP_REQUIRES_OK(context, context->allocate_output(0, grads_shape, |
| 150 | + &output_tensor)); |
| 151 | + |
| 152 | + auto output = output_tensor->template flat<float>(); |
| 153 | + |
| 154 | + // Call the cuda kernel launcher |
| 155 | + RoiPoolingGradKernelLauncher(orig_input.data(), orig_rois.data(), |
| 156 | + mb_size, n_rois, channels, height, width, pool_height_, pool_width_, |
| 157 | + orig_output.data(), orig_argmax_output.data(), orig_output_grad.data(), output.data()); |
| 158 | + } |
| 159 | +}; |
| 160 | + |
| 161 | + |
| 162 | +REGISTER_KERNEL_BUILDER(Name("RoiPoolingGrad").Device(DEVICE_GPU), RoiPoolingGradOp); |
// NOTE(review): removed non-code scraper residue ("0 commit comments") that
// trailed the file and would not compile.