Commit a591478

panyx0718 authored and martinwicke committed
Add resnet model. (tensorflow#273)
1 parent be7a899 commit a591478

7 files changed: +759 -0 lines changed

resnet/BUILD

Lines changed: 40 additions & 0 deletions
package(default_visibility = [":internal"])

licenses(["notice"])  # Apache 2.0

exports_files(["LICENSE"])

package_group(
    name = "internal",
    packages = [
        "//resnet/...",
    ],
)

filegroup(
    name = "py_srcs",
    data = glob([
        "**/*.py",
    ]),
)

py_library(
    name = "resnet_model",
    srcs = ["resnet_model.py"],
)

py_binary(
    name = "resnet_main",
    srcs = [
        "resnet_main.py",
    ],
    deps = [
        ":cifar_input",
        ":resnet_model",
    ],
)

py_library(
    name = "cifar_input",
    srcs = ["cifar_input.py"],
)

resnet/README.md

Lines changed: 103 additions & 0 deletions
<font size=4><b>Reproduced ResNet on the CIFAR-10 and CIFAR-100 datasets.</b></font>

contact: panyx0718 ([email protected])

<b>Dataset:</b>

https://www.cs.toronto.edu/~kriz/cifar.html

<b>Related papers:</b>

Identity Mappings in Deep Residual Networks

https://arxiv.org/pdf/1603.05027v2.pdf

Deep Residual Learning for Image Recognition

https://arxiv.org/pdf/1512.03385v1.pdf

Wide Residual Networks

https://arxiv.org/pdf/1605.07146v1.pdf

<b>Settings:</b>

* Randomly split the 50k training set into a 45k/5k train/eval split.
* Pad to 36x36 and random crop. Horizontal flip. Per-image whitening.
* Momentum optimizer with momentum 0.9.
* Learning rate schedule: 0.1 (40k), 0.01 (60k), 0.001 (>60k).
* L2 weight decay: 0.002.
* Batch size: 128. (The 28-10 wide and 1001-layer bottleneck models use 64.)

<b>Results:</b>

<left>
![Precisions](g3doc/cifar_resnet.gif)
</left>
<left>
![Precisions Legends](g3doc/cifar_resnet_legends.gif)
</left>


CIFAR-10 Model|Best Precision|Steps
--------------|--------------|------
32 layer|92.5%|~80k
110 layer|93.6%|~80k
164 layer bottleneck|94.5%|~80k
1001 layer bottleneck|94.9%|~80k
28-10 wide|95%|~90k

CIFAR-100 Model|Best Precision|Steps
---------------|--------------|-----
32 layer|68.1%|~45k
110 layer|71.3%|~60k
164 layer bottleneck|75.7%|~50k
1001 layer bottleneck|78.2%|~70k
28-10 wide|78.3%|~70k

<b>Prerequisite:</b>

1. Install TensorFlow and Bazel.

2. Download the CIFAR-10/CIFAR-100 dataset.

```shell
curl -o cifar-10-binary.tar.gz https://www.cs.toronto.edu/~kriz/cifar-10-binary.tar.gz
curl -o cifar-100-binary.tar.gz https://www.cs.toronto.edu/~kriz/cifar-100-binary.tar.gz
```

<b>How to run:</b>

```shell
# cd to your workspace.
# It contains an empty WORKSPACE file, the resnet code and the cifar10 dataset.
ls -R
.:
cifar10  resnet  WORKSPACE

./cifar10:
test.bin  train.bin  validation.bin

./resnet:
BUILD  cifar_input.py  g3doc  README.md  resnet_main.py  resnet_model.py

# Build everything for GPU.
bazel build -c opt --config=cuda resnet/...

# Train the model.
bazel-bin/resnet/resnet_main --train_data_path=cifar10/train.bin \
                             --log_root=/tmp/resnet_model \
                             --train_dir=/tmp/resnet_model/train \
                             --dataset='cifar10' \
                             --num_gpus=1

# Evaluate the model.
# Avoid running on the same GPU as the training job at the same time,
# otherwise you might run out of memory.
bazel-bin/resnet/resnet_main --eval_data_path=cifar10/test.bin \
                             --log_root=/tmp/resnet_model \
                             --eval_dir=/tmp/resnet_model/test \
                             --mode=eval \
                             --dataset='cifar10' \
                             --num_gpus=0
```
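
The learning rate schedule listed under Settings is a plain piecewise-constant step function over the global training step. The schedule actually used by this commit lives in resnet_main.py, which is not shown in this excerpt; the sketch below only illustrates the quoted values and is an assumption about how they are applied, not the author's code.

```python
# Illustrative sketch of the README's schedule (not from this commit):
# 0.1 up to 40k steps, 0.01 up to 60k steps, 0.001 afterwards.
def learning_rate(global_step):
  """Return the piecewise-constant learning rate for a training step."""
  if global_step < 40000:
    return 0.1
  elif global_step < 60000:
    return 0.01
  else:
    return 0.001
```

For example, `learning_rate(50000)` would return 0.01.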

resnet/cifar_input.py

Lines changed: 115 additions & 0 deletions
# Copyright 2016 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================

"""CIFAR dataset input module."""

import tensorflow as tf


def build_input(dataset, data_path, batch_size, mode):
  """Build CIFAR image and labels.

  Args:
    dataset: Either 'cifar10' or 'cifar100'.
    data_path: Filename for data.
    batch_size: Input batch size.
    mode: Either 'train' or 'eval'.
  Returns:
    images: Batches of images. [batch_size, image_size, image_size, 3]
    labels: Batches of labels. [batch_size, num_classes]
  Raises:
    ValueError: when the specified dataset is not supported.
  """
  image_size = 32
  if dataset == 'cifar10':
    label_bytes = 1
    label_offset = 0
    num_classes = 10
  elif dataset == 'cifar100':
    label_bytes = 1
    label_offset = 1
    num_classes = 100
  else:
    raise ValueError('Not supported dataset %s' % dataset)

  depth = 3
  image_bytes = image_size * image_size * depth
  record_bytes = label_bytes + label_offset + image_bytes

  file_queue = tf.train.string_input_producer([data_path], shuffle=True)
  # Read examples from files in the filename queue.
  reader = tf.FixedLengthRecordReader(record_bytes=record_bytes)
  _, value = reader.read(file_queue)

  # Convert these examples to dense labels and processed images.
  record = tf.reshape(tf.decode_raw(value, tf.uint8), [record_bytes])
  label = tf.cast(tf.slice(record, [label_offset], [label_bytes]), tf.int32)
  # The image bytes start after the label (and any coarse-label offset).
  # Convert from [depth * height * width] to [depth, height, width].
  depth_major = tf.reshape(
      tf.slice(record, [label_offset + label_bytes], [image_bytes]),
      [depth, image_size, image_size])
  # Convert from [depth, height, width] to [height, width, depth].
  image = tf.cast(tf.transpose(depth_major, [1, 2, 0]), tf.float32)

  if mode == 'train':
    image = tf.image.resize_image_with_crop_or_pad(
        image, image_size + 4, image_size + 4)
    image = tf.random_crop(image, [image_size, image_size, 3])
    image = tf.image.random_flip_left_right(image)
    # Brightness/saturation/contrast provides small gains (.2%~.5%) on cifar.
    # image = tf.image.random_brightness(image, max_delta=63. / 255.)
    # image = tf.image.random_saturation(image, lower=0.5, upper=1.5)
    # image = tf.image.random_contrast(image, lower=0.2, upper=1.8)
    image = tf.image.per_image_whitening(image)

    example_queue = tf.RandomShuffleQueue(
        capacity=16 * batch_size,
        min_after_dequeue=8 * batch_size,
        dtypes=[tf.float32, tf.int32],
        shapes=[[image_size, image_size, depth], [1]])
    num_threads = 16
  else:
    image = tf.image.resize_image_with_crop_or_pad(
        image, image_size, image_size)
    image = tf.image.per_image_whitening(image)

    example_queue = tf.FIFOQueue(
        3 * batch_size,
        dtypes=[tf.float32, tf.int32],
        shapes=[[image_size, image_size, depth], [1]])
    num_threads = 1

  example_enqueue_op = example_queue.enqueue([image, label])
  tf.train.add_queue_runner(tf.train.queue_runner.QueueRunner(
      example_queue, [example_enqueue_op] * num_threads))

  # Read 'batch' labels + images from the example queue.
  images, labels = example_queue.dequeue_many(batch_size)
  labels = tf.reshape(labels, [batch_size, 1])
  indices = tf.reshape(tf.range(0, batch_size, 1), [batch_size, 1])
  labels = tf.sparse_to_dense(
      tf.concat(1, [indices, labels]),
      [batch_size, num_classes], 1.0, 0.0)

  assert len(images.get_shape()) == 4
  assert images.get_shape()[0] == batch_size
  assert images.get_shape()[-1] == 3
  assert len(labels.get_shape()) == 2
  assert labels.get_shape()[0] == batch_size
  assert labels.get_shape()[1] == num_classes

  # Display the training images in the visualizer.
  tf.image_summary('images', images)
  return images, labels
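
For context, here is a minimal usage sketch of `build_input` under the TF 0.x queue-runner API this commit targets. The `cifar10/train.bin` path and the session block are illustrative assumptions taken from the README's directory layout; the real caller is resnet_main.py, which is not shown in this excerpt.

```python
# Hypothetical usage of cifar_input.build_input (not part of this commit).
import tensorflow as tf
import cifar_input

# Build the input pipeline for CIFAR-10 training data.
images, labels = cifar_input.build_input(
    'cifar10', 'cifar10/train.bin', batch_size=128, mode='train')

with tf.Session() as sess:
  # Start the queue runners registered by build_input.
  coord = tf.train.Coordinator()
  threads = tf.train.start_queue_runners(sess=sess, coord=coord)
  # One dequeued batch: images is [128, 32, 32, 3], labels is one-hot [128, 10].
  image_batch, label_batch = sess.run([images, labels])
  print(image_batch.shape, label_batch.shape)
  coord.request_stop()
  coord.join(threads)
```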

resnet/g3doc/cifar_resnet.gif

14.2 KB

resnet/g3doc/cifar_resnet_legends.gif

4.49 KB

0 commit comments
