Commit 6dce5c4b authored by Yuxin Wu

update docs. cleanup scripts

parent acae3fe5
@@ -13,7 +13,7 @@ It's Yet Another TF wrapper, but different in:
 1. Focus on __training speed__.
   + Speed comes for free with tensorpack -- it uses TensorFlow in the __efficient way__ with no extra overhead.
-    On various CNNs, it runs 1.5~1.7x faster than the equivalent Keras code.
+    On various CNNs, it runs 1.1~2x faster than the equivalent Keras code.
   + Data-parallel multi-GPU training is off-the-shelf to use. It runs as fast as Google's [official benchmark](https://www.tensorflow.org/performance/benchmarks).
@@ -12,10 +12,10 @@ for other FCN tasks such as semantic segmentation and detection.
 ## Usage
-This script only needs the original BSDS dataset and applies augmentation on the fly.
+This script needs the original BSDS dataset and applies augmentation on the fly.
 It will automatically download the dataset to `$TENSORPACK_DATASET/` if not there.
-It requires pretrained vgg16 model. See the docs in [examples/load-vgg16.py](../load-vgg16.py)
+It requires the pretrained vgg16 model. See the docs in [examples/CaffeModels](../CaffeModels)
 for instructions to convert from vgg16 caffe model.

 To view augmented training images:
@@ -34,11 +34,3 @@ To inference (produce a heatmap at each level at out*.png):
 ./hed.py --load pretrained.model --run a.jpg
 ```
 Models I trained can be downloaded [here](http://models.tensorpack.com/HED/).
-
-To view the loss curve:
-```bash
-cat train_log/hed/stat.json | jq '.[] |
-"\(.xentropy1)\t\(.xentropy2)\t\(.xentropy3)\t\(.xentropy4)\t\(.xentropy5)\t\(.xentropy6)"' -r | \
-tpk-plot-point --legend 1,2,3,4,5,final --decay 0.8
-```
-Or just open tensorboard.
#!/usr/bin/env python
# -*- coding: UTF-8 -*-
# File: dump-dataflow.py
# Author: Yuxin Wu <ppwwyyxx@gmail.com>

import argparse
import imp
import os

import cv2
import tqdm

from tensorpack.utils import logger
from tensorpack.utils.fs import mkdir_p
from tensorpack.dataflow import RepeatedData

parser = argparse.ArgumentParser()
parser.add_argument(dest='config')
parser.add_argument('-o', '--output',
                    help='output directory to dump dataset images. If not given, will not dump images.')
parser.add_argument('-s', '--scale',
                    help='scale the image data (maybe by 255)', default=1, type=int)
parser.add_argument('--index',
                    help='index of the image component in a datapoint',
                    default=0, type=int)
parser.add_argument('-n', '--number', help='number of images to dump',
                    default=10, type=int)
args = parser.parse_args()

logger.auto_set_dir(action='d')

# Load the user's config script and build its dataflow.
get_config_func = imp.load_source('config_script', args.config).get_config
config = get_config_func()
config.dataset.reset_state()

if args.output:
    # Dump the first `args.number` images to the output directory.
    mkdir_p(args.output)
    cnt = 0
    for dp in config.dataset.get_data():
        imgbatch = dp[args.index]
        if cnt > args.number:
            break
        for bi, img in enumerate(imgbatch):
            cnt += 1
            fname = os.path.join(args.output, '{:03d}-{}.png'.format(cnt, bi))
            cv2.imwrite(fname, img * args.scale)

# Benchmark the dataflow speed over `args.number` datapoints.
NR_DP_TEST = args.number
logger.info("Testing dataflow speed:")
ds = RepeatedData(config.dataset, -1)
with tqdm.tqdm(total=NR_DP_TEST, leave=True, unit='data points') as pbar:
    for idx, dp in enumerate(ds.get_data()):
        del dp
        if idx > NR_DP_TEST:
            break
        pbar.update()
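For reference, `dump-dataflow.py` only assumes that the config script passed on the command line defines a `get_config()` returning an object whose `dataset` attribute is a DataFlow. A minimal, hypothetical config script (the `Config` class and all names below are illustrative, not part of the repo) might look like:

```python
# myconfig.py -- usable as: ./dump-dataflow.py myconfig.py -o out -n 20 -s 255
# dump-dataflow.py only reads the `.dataset` attribute of the returned object.
from tensorpack.dataflow import BatchData, dataset


class Config(object):
    def __init__(self, ds):
        self.dataset = ds


def get_config():
    ds = dataset.Mnist('train')   # any DataFlow whose datapoints contain images
    ds = BatchData(ds, 16)        # the dump loop iterates over batched images
    return Config(ds)
```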
#!/usr/bin/env python
# -*- coding: utf-8 -*-
"""
A general curve plotter to create curves such as:
https://github.com/ppwwyyxx/tensorpack/tree/master/examples/ResNet

A minimal example:
$ cat examples/train_log/mnist-convnet/stat.json \
    | jq '.[] | .train_error, .validation_error' \
    | paste - - \
    | plot-point.py --legend 'train,val' --xlabel 'epoch' --ylabel 'error'

For more usage, see `plot-point.py -h` or the code.
"""

import argparse
import sys
from collections import defaultdict
from itertools import chain

import matplotlib.font_manager as fontm
import matplotlib.pyplot as plt
import numpy as np
import six

# from matplotlib import rc
# rc('font', **{'family': 'sans-serif', 'sans-serif': ['Helvetica']})
# rc('font', **{'family': 'sans-serif', 'sans-serif': ['Microsoft Yahei']})
# rc('text', usetex=True)

STDIN_FNAME = '-'
def get_args():
    description = "plot points into a graph."
    parser = argparse.ArgumentParser(description=description)
    parser.add_argument('-i', '--input',
                        help='input data file, use "-" for stdin. Default stdin. '
                             'Input format is many rows of DELIMITER-separated data.',
                        default='-')
    parser.add_argument('-o', '--output',
                        help='output image', default='')
    parser.add_argument('--show',
                        help='show the figure after rendering',
                        action='store_true')
    parser.add_argument('-c', '--column',
                        help="describe each column in the data, for example 'x,y,y'. "
                             "Plot attributes can be appended after 'y', like 'ythick;cr'. "
                             "By default, assume all columns are y.")
    parser.add_argument('-t', '--title',
                        help='title of the graph',
                        default='')
    parser.add_argument('--xlabel',
                        help='x label', type=six.text_type)
    parser.add_argument('--ylabel',
                        help='y label', type=six.text_type)
    parser.add_argument('--xlim',
                        help='x lim', type=float, nargs=2)
    parser.add_argument('--ylim',
                        help='y lim', type=float, nargs=2)
    parser.add_argument('-s', '--scale',
                        help='scale of each y, separated by comma')
    parser.add_argument('--annotate-maximum',
                        help='annotate the maximum value in the graph',
                        action='store_true')
    parser.add_argument('--annotate-minimum',
                        help='annotate the minimum value in the graph',
                        action='store_true')
    parser.add_argument('--xkcd',
                        help='xkcd style',
                        action='store_true')
    parser.add_argument('--decay',
                        help='exponential decay rate to smooth Y',
                        type=float, default=0)
    parser.add_argument('-l', '--legend',
                        help='legend for each y')
    parser.add_argument('-d', '--delimiter',
                        help='column delimiter', default='\t')

    global args
    args = parser.parse_args()
    if not args.show and not args.output:
        args.show = True
def read_entire_matrix():
    """Read the whole input into a column-major matrix (a list of columns)."""
    if args.input == STDIN_FNAME:
        fin = sys.stdin
    else:
        fin = open(args.input)
    all_lines = fin.readlines()
    if args.input != STDIN_FNAME:
        fin.close()

    nr_column = len(all_lines[0].rstrip('\n').split(args.delimiter))
    data = [[] for _ in range(nr_column)]
    ended = defaultdict(bool)
    for line in all_lines:
        line = line.rstrip('\n').split(args.delimiter)
        assert len(line) <= nr_column, \
            "One row has too many columns (separated by {})! Line: {}".format(
                repr(args.delimiter), line)
        for idx, val in enumerate(line):
            if val == '':
                # An empty cell marks the end of this column;
                # no more values may follow in it.
                ended[idx] = True
                continue
            val = float(val)
            assert not ended[idx], "Column {} has a hole!".format(idx)
            data[idx].append(val)
    return data
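# Illustrative input for read_entire_matrix() (values made up): with the
# default tab delimiter, these three rows
#
#     0.9<TAB>0.8
#     0.7<TAB>0.6
#     0.5
#
# parse to data == [[0.9, 0.7, 0.5], [0.8, 0.6]]; a column may end early,
# but may not resume after an empty cell.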
class Sequence(object):
    """One curve: an x column paired with a y column and its plot options."""

    def __init__(self, xs, ys, plot_args=None):
        """
        Args:
            xs, ys: lists of floats
        """
        self.xs = np.copy(np.asarray(xs))
        self.ys = np.asarray(ys)
        assert len(xs) >= len(ys), \
            "x column is shorter than y column! {} < {}".format(len(xs), len(ys))
        self.xs = self.xs[:len(ys)]

        if plot_args is None:
            plot_args = {}
        self.plot_args = plot_args
        self.legend = None
        self.drawables = []

    def exponential_smooth(self, alpha):
        """Smooth ys with an exponential moving average:
        ret[k] = alpha * ret[k-1] + (1 - alpha) * ys[k], with ret[0] = ys[0]."""
        data = self.ys
        ret = np.copy(data)
        now = data[0]
        for k in range(len(data)):
            ret[k] = now * alpha + data[k] * (1 - alpha)
            now = ret[k]
        self.ys = ret

    def scale_y(self, scale):
        if scale == 1.0:
            return
        self.ys = self.ys * scale
        if self.legend:
            self.legend = "{},scaley={:.2g}".format(self.legend, scale)

    @property
    def xrange(self):
        return np.array([min(self.xs), max(self.xs)])

    def toggle_vis(self):
        """Flip visibility of this curve; returns the new visibility."""
        assert len(self.drawables), "Called before plot()!"
        vis = not self.drawables[0].get_visible()
        for d in self.drawables:
            d.set_visible(vis)
        return vis
def annotate_min_max(data_x, data_y, ax):
    """
    Annotate the extrema of one (X, Y) sequence on top of ax.
    """
    def filter_valid_range(points, rect):
        """rect = (min_x, max_x, min_y, max_y)"""
        ret = []
        for x, y in points:
            if rect[0] <= x <= rect[1] and rect[2] <= y <= rect[3]:
                ret.append((x, y))
        if len(ret) == 0:
            ret.append(points[0])
        return ret

    max_x, min_x = max(data_x), min(data_x)
    max_y, min_y = max(data_y), min(data_y)
    x_range = max_x - min_x
    y_range = max_y - min_y
    x_max, y_max = data_x[0], data_y[0]
    x_min, y_min = data_x[0], data_y[0]
    for i in range(1, len(data_x)):
        if data_y[i] > y_max:
            y_max = data_y[i]
            x_max = data_x[i]
        if data_y[i] < y_min:
            y_min = data_y[i]
            x_min = data_x[i]

    rect = ax.axis()
    if args.annotate_maximum:
        # Try four offsets around the extremum; use the first that stays
        # inside the axes.
        text_x, text_y = filter_valid_range([
            (x_max + 0.05 * x_range, y_max + 0.025 * y_range),
            (x_max - 0.05 * x_range, y_max + 0.025 * y_range),
            (x_max + 0.05 * x_range, y_max - 0.025 * y_range),
            (x_max - 0.05 * x_range, y_max - 0.025 * y_range)],
            rect)[0]
        ax.annotate('maximum ({:d},{:.3f})'.format(int(x_max), y_max),
                    xy=(x_max, y_max),
                    xytext=(text_x, text_y),
                    arrowprops=dict(arrowstyle='->'))
    if args.annotate_minimum:
        text_x, text_y = filter_valid_range([
            (x_min + 0.05 * x_range, y_min - 0.025 * y_range),
            (x_min - 0.05 * x_range, y_min - 0.025 * y_range),
            (x_min + 0.05 * x_range, y_min + 0.025 * y_range),
            (x_min - 0.05 * x_range, y_min + 0.025 * y_range)],
            rect)[0]
        ax.annotate('minimum ({:d},{:.3f})'.format(int(x_min), y_min),
                    xy=(x_min, y_min),
                    xytext=(text_x, text_y),
                    arrowprops=dict(arrowstyle='->'))
def plot_args_from_column_desc(desc):
    """Translate attributes appended to a 'y' column into matplotlib kwargs."""
    if not desc:
        return {}
    ret = {}
    desc = desc.split(';')
    if 'thick' in desc:
        ret['lw'] = 5
    if 'dash' in desc:
        ret['ls'] = '--'
    for v in desc:
        if v.startswith('c'):
            ret['color'] = v[1:]
    return ret
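# For example, a column described as 'ythick;cr' yields
# plot_args_from_column_desc('thick;cr') == {'lw': 5, 'color': 'r'},
# i.e. a thick red curve.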
def do_plot(seqs):
    """
    Args:
        seqs: list of Sequence
    """
    fig = plt.figure(figsize=(16.18 / 1.2, 10 / 1.2))
    ax = fig.add_axes((0.1, 0.2, 0.8, 0.7))

    for seq in seqs:
        curve_obj = plt.plot(seq.xs, seq.ys, label=seq.legend, **seq.plot_args)[0]
        c = curve_obj.get_color()
        fill_obj = plt.fill_between(seq.xs, seq.ys, alpha=0.1, facecolor=c)
        if args.annotate_maximum or args.annotate_minimum:
            annotate_min_max(seq.xs, seq.ys, ax)
        seq.drawables.extend([curve_obj, fill_obj])

    # labels and axis limits
    if args.xlabel:
        plt.xlabel(args.xlabel, fontsize='xx-large')
    if args.ylabel:
        plt.ylabel(args.ylabel, fontsize='xx-large')
    if args.xlim:
        plt.xlim(args.xlim[0], args.xlim[1])
    else:
        # extend xmax a bit so the last point isn't clipped
        all_xrange = np.asarray([s.xrange for s in seqs])
        minx, maxx = min(all_xrange[:, 0]), max(all_xrange[:, 1])
        new_maxx = maxx + (maxx - minx) * 0.05
        plt.xlim(minx, new_maxx)
    if args.ylim:
        plt.ylim(args.ylim[0], args.ylim[1])

    legend_obj = plt.legend(loc='best', fontsize='xx-large')

    # clicking a legend entry toggles the visibility of its curve
    legend_line_to_seq = {}
    for legend_line, seq in zip(legend_obj.get_lines(), seqs):
        legend_line.set_picker(5)  # 5pt pick radius
        legend_line_to_seq[legend_line] = seq

    def onpick(event):
        legline = event.artist
        seq = legend_line_to_seq[legline]
        vis = seq.toggle_vis()
        legline.set_alpha(1.0 if vis else 0.2)
        fig.canvas.draw()

    fig.canvas.mpl_connect('pick_event', onpick)

    for label in chain(ax.get_xticklabels(), ax.get_yticklabels()):
        label.set_fontproperties(fontm.FontProperties(size=15))
    ax.grid(color='gray', linestyle='dashed')

    plt.title(args.title, fontdict={'fontsize': 20})
    if args.output != '':
        plt.savefig(args.output, bbox_inches='tight')
    if args.show:
        plt.show()
def main():
    get_args()
    data = read_entire_matrix()  # nr_column x nr_row

    # parse the column format
    nr_column = len(data)
    if args.column is None:
        column = ['y'] * nr_column
    else:
        column = args.column.strip().split(',')
        for k in column:
            assert k[0] in ['x', 'y', 'n']  # 'n' columns are ignored
    assert nr_column == len(column), \
        "Column description and data don't have the same length: {} != {}".format(
            nr_column, len(column))

    # split data into x columns and y columns
    data_xs, data_ys, desc_ys = [], [], []
    for column_data, column_desc in zip(data, column):
        if column_desc[0] == 'y':
            data_ys.append(column_data)
            desc_ys.append(column_desc)
        elif column_desc[0] == 'x':
            data_xs.append(column_data)

    num_curve = len(data_ys)
    length_ys = [len(t) for t in data_ys]
    print("Length of each Y column:", length_ys)

    # populate default xs
    if len(data_xs) > 1:
        assert len(data_xs) == num_curve, \
            "If multiple x columns are used, their number must equal the number of y columns"
    elif len(data_xs) == 1:
        data_xs = data_xs * num_curve
    else:
        data_xs = [list(range(1, max(length_ys) + 1))] * num_curve

    # build one Sequence per curve
    seqs = []
    assert len(data_xs) == len(data_ys)
    for idx, (X, Y) in enumerate(zip(data_xs, data_ys)):
        col_desc = desc_ys[idx]
        seqs.append(Sequence(
            X, Y,
            plot_args=plot_args_from_column_desc(col_desc[1:])))

    if args.decay != 0:
        # TODO: allow a different decay for each y
        for s in seqs:
            s.exponential_smooth(args.decay)
    if args.legend:
        legends = args.legend.split(',')
        assert len(legends) == num_curve
        for legend, seq in zip(legends, seqs):
            seq.legend = legend
    if args.scale:
        scales = list(map(float, args.scale.split(',')))
        assert len(scales) == num_curve
        for scale, seq in zip(scales, seqs):
            seq.scale_y(scale)

    if args.xkcd:
        with plt.xkcd():
            do_plot(seqs)
    else:
        do_plot(seqs)


if __name__ == '__main__':
    main()
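As a quick usage sketch (the file name and data below are made up), one can write two y columns to a tab-separated file and plot them; `--decay` applies the exponential smoothing implemented in `Sequence.exponential_smooth`:

```python
# Generate a two-column TSV that plot-point.py can read.
import numpy as np

xs = np.arange(100)
train = 1.0 / (xs + 1) + np.random.uniform(0, 0.05, size=100)
val = 1.2 / (xs + 1) + np.random.uniform(0, 0.05, size=100)
with open('curves.tsv', 'w') as f:
    for a, b in zip(train, val):
        f.write('{}\t{}\n'.format(a, b))

# Then, for example:
#   ./plot-point.py -i curves.tsv --legend 'train,val' --decay 0.6 --show
```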
#!/usr/bin/env python
# -*- coding: utf-8 -*-
# File: serve-data.py
# Author: Yuxin Wu <ppwwyyxxc@gmail.com>

import argparse
import imp

from tensorpack.dataflow import serve_data

parser = argparse.ArgumentParser()
parser.add_argument(dest='config')
parser.add_argument('-p', '--port', help='port', type=int, required=True)
args = parser.parse_args()

# Load the user's config script and serve its dataflow over ZMQ.
get_config_func = imp.load_source('config_script', args.config).get_config
config = get_config_func()
ds = config.dataset
serve_data(ds, "tcp://*:{}".format(args.port))
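The consuming side is not shown in this commit; as a hedged sketch, tensorpack versions of this era paired `serve_data` with a `RemoteData` dataflow (the name and constructor below are assumptions based on that pairing; check your version's `tensorpack.dataflow` for the exact API):

```python
# Hypothetical consumer for the stream served above.
from tensorpack.dataflow import RemoteData

ds = RemoteData('tcp://localhost:8888')   # port must match serve-data.py -p
ds.reset_state()
for dp in ds.get_data():
    pass  # each dp is a datapoint produced by the remote config.dataset
```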
@@ -515,7 +515,8 @@ class StagingInput(FeedfreeInput):
             element should be sufficient.
             towers: deprecated
             device (str or None): if not None, place the StagingArea on a specific device. e.g., '/cpu:0'.
-                Otherwise, they are placed under where `get_inputs_tensors` gets called.
+                Otherwise, they are placed under where `get_inputs_tensors`
+                gets called, which could be unspecified in case of simple trainers.
         """
         assert isinstance(input, FeedfreeInput), input
         self._input = input
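A minimal usage sketch of the documented `device` argument (the module paths and the use of `QueueInput` and `FakeData` are assumptions about the surrounding tensorpack API, not part of this commit; `QueueInput` is a `FeedfreeInput`):

```python
# Pin the StagingArea to the CPU instead of wherever the input tensors are built.
from tensorpack.dataflow import FakeData
from tensorpack.input_source import QueueInput, StagingInput

df = FakeData([[32, 224, 224, 3], [32]], size=1000)  # dummy images + labels
input_source = StagingInput(QueueInput(df), device='/cpu:0')
```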