deform augmentation

47cbfe87 · Yuxin Wu · 2d923b91 · 47cbfe87 · 47cbfe87
Commit 47cbfe87 authored Feb 23, 2016 by Yuxin Wu
Hide whitespace changes
Inline Side-by-side

Showing with 99 additions and 8 deletions

tensorpack/dataflow/imgaug/_test.py tensorpack/dataflow/imgaug/_test.py +13 -8

tensorpack/dataflow/imgaug/deform.py tensorpack/dataflow/imgaug/deform.py +86 -0

No files found.
--- a/tensorpack/dataflow/imgaug/_test.py
+++ b/tensorpack/dataflow/imgaug/_test.py
@@ -3,16 +3,21 @@
 # File: _test.py
 # Author: Yuxin Wu <ppwwyyxx@gmail.com>
+import sys
 import cv2
-from . import *
+from . import AugmentorList, Flip, GaussianDeform, Image
+anchors = [(0.2, 0.2), (0.8, 0.8), (0.5, 0.5), (0.2, 0.5)]
 augmentors = AugmentorList([
-    Contrast((0.2,1.8)),
+    #Contrast((0.2,1.8)),
-    Flip(horiz=True)
+    #Flip(horiz=True),
+    GaussianDeform(anchors, (360,480), 1, randrange=10)
 ])
-img = cv2.imread('cat.jpg')
+while True:
-img = Image(img)
+    img = cv2.imread(sys.argv[1])
-augmentors.augment(img)
+    img = Image(img)
-cv2.imshow(" ", img.arr)
+    augmentors.augment(img)
-cv2.waitKey()
+    cv2.imshow(" ", img.arr.astype('uint8'))
+    cv2.waitKey()
--- a/tensorpack/dataflow/imgaug/deform.py
+++ b/tensorpack/dataflow/imgaug/deform.py
+#!/usr/bin/env python2
+# -*- coding: UTF-8 -*-
+# File: deform.py
+# Author: Yuxin Wu <ppwwyyxx@gmail.com>
+from .base import ImageAugmentor
+import numpy as np
+__all__ = ['GaussianDeform', 'GaussianMap']
+class GaussianMap(object):
+    def __init__(self, image_shape, sigma=0.5):
+        assert len(image_shape) == 2
+        self.shape = image_shape
+        self.sigma = sigma
+    def get_gaussian_weight(self, anchor):
+        ret = np.zeros(self.shape, dtype='float32')
+        y, x = np.mgrid[:self.shape[0], :self.shape[1]]
+        y = y.astype('float32') / ret.shape[0] - anchor[0]
+        x = x.astype('float32') / ret.shape[1] - anchor[1]
+        g = np.exp(-(x**2 + y ** 2) / self.sigma)
+        #cv2.imshow(" ", g)
+        #cv2.waitKey()
+        return g
+def np_sample(img, coords):
+    # a numpy implementation of ImageSample layer
+    coords = np.maximum(coords, 0)
+    coords = np.minimum(coords, np.array([img.shape[0]-1, img.shape[1]-1]))
+    lcoor = np.floor(coords).astype('int32')
+    ucoor = lcoor + 1
+    ucoor = np.minimum(ucoor, np.array([img.shape[0]-1, img.shape[1]-1]))
+    diff = coords - lcoor
+    neg_diff = 1.0 - diff
+    lcoory, lcoorx = np.split(lcoor, 2, axis=2)
+    ucoory, ucoorx = np.split(ucoor, 2, axis=2)
+    diff = np.repeat(diff, 3, 2).reshape((diff.shape[0], diff.shape[1], 2, 3))
+    neg_diff = np.repeat(neg_diff, 3, 2).reshape((diff.shape[0], diff.shape[1], 2, 3))
+    diffy, diffx = np.split(diff, 2, axis=2)
+    ndiffy, ndiffx = np.split(neg_diff, 2, axis=2)
+    ret = img[lcoory,lcoorx,:] * ndiffx * ndiffy + \
+            img[ucoory, ucoorx,:] * diffx * diffy + \
+            img[lcoory, ucoorx,:] * ndiffy * diffx + \
+            img[ucoory,lcoorx,:] * diffy * ndiffx
+    return ret[:,:,0,:]
+# TODO input/output with different shape
+class GaussianDeform(ImageAugmentor):
+    """
+    Some kind of deformation
+    """
+    #TODO docs
+    def __init__(self, anchors, shape, sigma=0.5, randrange=None):
+        """
+        anchors: in [0,1] coordinate
+        shape: 2D image shape
+        randrange: default to shape[0] / 8
+        """
+        self.anchors = anchors
+        self.K = len(self.anchors)
+        self.shape = shape
+        self.grid = np.mgrid[0:self.shape[0], 0:self.shape[1]].transpose(1,2,0)
+        self.grid = self.grid.astype('float32') # HxWx2
+        gm = GaussianMap(self.shape, sigma=sigma)
+        self.gws = np.array([gm.get_gaussian_weight(ank)
+                             for ank in self.anchors], dtype='float32') # KxHxW
+        self.gws = self.gws.transpose(1, 2, 0)  #HxWxK
+        if randrange is None:
+            self.randrange = self.shape[0] / 8
+        else:
+            self.randrange = randrange
+        self._init()
+    def _augment(self, img):
+        if img.coords:
+            raise NotImplementedError()
+        v = self.rng.rand(self.K, 2).astype('float32') - 0.5
+        v = v * 2 * self.randrange
+        grid = self.grid + np.dot(self.gws, v)
+        img.arr = np_sample(img.arr, grid)