Add script for classifying images, update gitignore.

2019-05-06 02:58:26 +02:00 · 2019-05-06 02:58:26 +02:00 · 0713f42692
commit 0713f42692
parent dfa0d87971
57 changed files with 290 additions and 14 deletions
--- a/.gitignore
+++ b/.gitignore
@ -1,4 +1,8 @@
-.vscode/*
-*/__pycache__/*
+.vscode/
+*/__pycache__/
 *tex
-Images/TrainingImages/*
+Images/TrainingImages/
+Model/bottleneck/
+Model/retrain_logs/
+Model/variables/
+Model/*.pb_log/
--- a/Images/TestImages/glass1.jpg
+++ b/Images/TestImages/glass1.jpg
--- a/Images/TestImages/glass100.jpg
+++ b/Images/TestImages/glass100.jpg
--- a/Images/TestImages/glass110.jpg
+++ b/Images/TestImages/glass110.jpg
--- a/Images/TestImages/glass113.jpg
+++ b/Images/TestImages/glass113.jpg
--- a/Images/TestImages/glass116.jpg
+++ b/Images/TestImages/glass116.jpg
--- a/Images/TestImages/glass122.jpg
+++ b/Images/TestImages/glass122.jpg
--- a/Images/TestImages/glass126.jpg
+++ b/Images/TestImages/glass126.jpg
--- a/Images/TestImages/glass156.jpg
+++ b/Images/TestImages/glass156.jpg
--- a/Images/TestImages/glass42.jpg
+++ b/Images/TestImages/glass42.jpg
--- a/Images/TestImages/glass43.jpg
+++ b/Images/TestImages/glass43.jpg
--- a/Images/TestImages/glass44.jpg
+++ b/Images/TestImages/glass44.jpg
--- a/Images/TestImages/glass46.jpg
+++ b/Images/TestImages/glass46.jpg
--- a/Images/TestImages/glass55.jpg
+++ b/Images/TestImages/glass55.jpg
--- a/Images/TestImages/glass59.jpg
+++ b/Images/TestImages/glass59.jpg
--- a/Images/TestImages/metal112.jpg
+++ b/Images/TestImages/metal112.jpg
--- a/Images/TestImages/metal20.jpg
+++ b/Images/TestImages/metal20.jpg
--- a/Images/TestImages/metal24.jpg
+++ b/Images/TestImages/metal24.jpg
--- a/Images/TestImages/metal27.jpg
+++ b/Images/TestImages/metal27.jpg
--- a/Images/TestImages/metal29.jpg
+++ b/Images/TestImages/metal29.jpg
--- a/Images/TestImages/metal31.jpg
+++ b/Images/TestImages/metal31.jpg
--- a/Images/TestImages/metal33.jpg
+++ b/Images/TestImages/metal33.jpg
--- a/Images/TestImages/metal50.jpg
+++ b/Images/TestImages/metal50.jpg
--- a/Images/TestImages/metal54.jpg
+++ b/Images/TestImages/metal54.jpg
--- a/Images/TestImages/metal86.jpg
+++ b/Images/TestImages/metal86.jpg
--- a/Images/TestImages/metal89.jpg
+++ b/Images/TestImages/metal89.jpg
--- a/Images/TestImages/metal94.jpg
+++ b/Images/TestImages/metal94.jpg
--- a/Images/TestImages/paper102.jpg
+++ b/Images/TestImages/paper102.jpg
--- a/Images/TestImages/paper111.jpg
+++ b/Images/TestImages/paper111.jpg
--- a/Images/TestImages/paper113.jpg
+++ b/Images/TestImages/paper113.jpg
--- a/Images/TestImages/paper118.jpg
+++ b/Images/TestImages/paper118.jpg
--- a/Images/TestImages/paper16.jpg
+++ b/Images/TestImages/paper16.jpg
--- a/Images/TestImages/paper20.jpg
+++ b/Images/TestImages/paper20.jpg
--- a/Images/TestImages/paper35.jpg
+++ b/Images/TestImages/paper35.jpg
--- a/Images/TestImages/paper46.jpg
+++ b/Images/TestImages/paper46.jpg
--- a/Images/TestImages/paper52.jpg
+++ b/Images/TestImages/paper52.jpg
--- a/Images/TestImages/paper56.jpg
+++ b/Images/TestImages/paper56.jpg
--- a/Images/TestImages/paper71.jpg
+++ b/Images/TestImages/paper71.jpg
--- a/Images/TestImages/paper72.jpg
+++ b/Images/TestImages/paper72.jpg
--- a/Images/TestImages/paper76.jpg
+++ b/Images/TestImages/paper76.jpg
--- a/Images/TestImages/paper94.jpg
+++ b/Images/TestImages/paper94.jpg
--- a/Images/TestImages/plastic1.jpg
+++ b/Images/TestImages/plastic1.jpg
--- a/Images/TestImages/plastic20.jpg
+++ b/Images/TestImages/plastic20.jpg
--- a/Images/TestImages/plastic32.jpg
+++ b/Images/TestImages/plastic32.jpg
--- a/Images/TestImages/plastic57.jpg
+++ b/Images/TestImages/plastic57.jpg
--- a/Images/TestImages/plastic73.jpg
+++ b/Images/TestImages/plastic73.jpg
--- a/Images/TestImages/plastic77.jpg
+++ b/Images/TestImages/plastic77.jpg
--- a/Images/TestImages/plastic78.jpg
+++ b/Images/TestImages/plastic78.jpg
--- a/Images/TestImages/plastic85.jpg
+++ b/Images/TestImages/plastic85.jpg
--- a/Images/TestImages/plastic91.jpg
+++ b/Images/TestImages/plastic91.jpg
--- a/Images/TestImages/plastic98.jpg
+++ b/Images/TestImages/plastic98.jpg
--- a/Logic/TrashRecognition/ImageClassification.py
+++ b/Logic/TrashRecognition/ImageClassification.py
@ -1 +1,156 @@
-import tensorflow as tf
+# Copyright 2017 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import argparse
+import os
+
+import numpy as np
+import tensorflow as tf
+
+
+def load_graph(model_file):
+  graph = tf.Graph()
+  graph_def = tf.GraphDef()
+
+  with open(model_file, "rb") as f:
+    graph_def.ParseFromString(f.read())
+  with graph.as_default():
+    tf.import_graph_def(graph_def)
+
+  return graph
+
+
+def read_tensor_from_image_file(file_name,
+                                input_height=299,
+                                input_width=299,
+                                input_mean=0,
+                                input_std=255):
+  input_name = "file_reader"
+  output_name = "normalized"
+  file_reader = tf.read_file(file_name, input_name)
+  if file_name.endswith(".png"):
+    image_reader = tf.image.decode_png(
+        file_reader, channels=3, name="png_reader")
+  elif file_name.endswith(".gif"):
+    image_reader = tf.squeeze(
+        tf.image.decode_gif(file_reader, name="gif_reader"))
+  elif file_name.endswith(".bmp"):
+    image_reader = tf.image.decode_bmp(file_reader, name="bmp_reader")
+  else:
+    image_reader = tf.image.decode_jpeg(
+        file_reader, channels=3, name="jpeg_reader")
+  float_caster = tf.cast(image_reader, tf.float32)
+  dims_expander = tf.expand_dims(float_caster, 0)
+  resized = tf.image.resize_bilinear(dims_expander, [input_height, input_width])
+  normalized = tf.divide(tf.subtract(resized, [input_mean]), [input_std])
+  sess = tf.Session()
+  result = sess.run(normalized)
+
+  return result
+
+
+def load_labels(label_file):
+  label = []
+  proto_as_ascii_lines = tf.gfile.GFile(label_file).readlines()
+  for l in proto_as_ascii_lines:
+    label.append(l.rstrip())
+  return label
+
+
+if __name__ == "__main__":
+  model_file = "Model/retrained_graph.pb"
+  label_file = "Model/retrained_labels.txt"
+  input_height = 299
+  input_width = 299
+  input_mean = 128
+  input_std = 128
+  input_layer = "input"
+  output_layer = "InceptionV3/Predictions/Reshape_1"
+
+  parser = argparse.ArgumentParser()
+
+  parser.add_argument("--graph",
+   default="Model/retrained_graph.pb",
+   help="graph/model to be executed")
+
+  parser.add_argument("--labels",
+   default="Model/retrained_labels.txt",
+   help="name of file containing labels")
+
+  parser.add_argument("--input_height", type=int, help="input height")
+
+  parser.add_argument("--input_width", type=int, help="input width")
+
+  parser.add_argument("--input_mean", type=int, help="input mean")
+
+  parser.add_argument("--input_std", type=int, help="input std")
+
+  parser.add_argument("--input_layer",
+   default="Placeholder",
+    help="name of input layer")
+
+  parser.add_argument("--output_layer",
+   default="final_result",
+   help="name of output layer")
+
+  args = parser.parse_args()
+
+  if args.graph:
+    model_file = args.graph
+  if args.labels:
+    label_file = args.labels
+  if args.input_height:
+    input_height = args.input_height
+  if args.input_width:
+    input_width = args.input_width
+  if args.input_mean:
+    input_mean = args.input_mean
+  if args.input_std:
+    input_std = args.input_std
+  if args.input_layer:
+    input_layer = args.input_layer
+  if args.output_layer:
+    output_layer = args.output_layer
+  
+  graph = load_graph(model_file)
+
+  for filename in os.listdir('Images/TestImages'):
+    t = read_tensor_from_image_file(
+      f'Images/TestImages/{filename}',
+      input_height=input_height,
+      input_width=input_width,
+      input_mean=input_mean,
+      input_std=input_std)
+    input_name = "import/" + input_layer
+    output_name = "import/" + output_layer
+    input_operation = graph.get_operation_by_name(input_name)
+    output_operation = graph.get_operation_by_name(output_name)
+
+    with tf.Session(graph=graph) as sess:
+      results = sess.run(output_operation.outputs[0], {
+          input_operation.outputs[0]: t
+      })
+    results = np.squeeze(results)
+
+    top_k = results.argsort()[-5:][::-1]
+    labels = load_labels(label_file)
+    print(f'{filename}: {labels[top_k[0]]} with {results[top_k[0]] * 100}% certainity')
+    # for i in top_k:
+    #   print(labels[i], results[i])
+ 
--- a/Logic/TrashRecognition/LoadGraphToTB.py
+++ b/Logic/TrashRecognition/LoadGraphToTB.py
@ -0,0 +1,22 @@
+import tensorflow as tf
+from tensorflow.python.platform import gfile
+import os
+
+def load_pb_to_log(filename):
+    with tf.Session() as sess:
+        with gfile.FastGFile(filename, 'rb') as f:
+            graph_def = tf.GraphDef()
+            graph_def.ParseFromString(f.read())
+            g_in = tf.import_graph_def(graph_def)
+    LOGDIR = f'{filename}_log'
+    train_writer = tf.summary.FileWriter(LOGDIR)
+    train_writer.add_graph(sess.graph)
+
+def main():
+    for filename in os.listdir('Model'):
+        fname, fext = os.path.splitext(filename)
+        if fext == '.pb':
+            load_pb_to_log(f'Model/{filename}')
+
+# Run the conversion only when this file is executed as a script, not when it
+# is imported as a module.
+if __name__ == "__main__":
+    main()
--- a/Logic/TrashRecognition/Retrain.py
+++ b/Logic/TrashRecognition/Retrain.py
@ -15,6 +15,105 @@
 # NOTICE: This work was derived from tensorflow/examples/image_retraining
 # and modified to use TensorFlow Hub modules.

+# pylint: disable=line-too-long
+r"""Simple transfer learning with image modules from TensorFlow Hub.
+
+This example shows how to train an image classifier based on any
+TensorFlow Hub module that computes image feature vectors. By default,
+it uses the feature vectors computed by Inception V3 trained on ImageNet.
+For more options, search https://tfhub.dev for image feature vector modules.
+
+The top layer receives as input a 2048-dimensional vector (assuming
+Inception V3) for each image. We train a softmax layer on top of this
+representation. If the softmax layer contains N labels, this corresponds
+to learning N + 2048*N model parameters for the biases and weights.
+
+Here's an example, which assumes you have a folder containing class-named
+subfolders, each full of images for each label. The example folder flower_photos
+should have a structure like this:
+
+~/flower_photos/daisy/photo1.jpg
+~/flower_photos/daisy/photo2.jpg
+...
+~/flower_photos/rose/anotherphoto77.jpg
+...
+~/flower_photos/sunflower/somepicture.jpg
+
+The subfolder names are important, since they define what label is applied to
+each image, but the filenames themselves don't matter. (For a working example,
+download http://download.tensorflow.org/example_images/flower_photos.tgz
+and run  tar xzf flower_photos.tgz  to unpack it.)
+
+Once your images are prepared, and you have pip-installed tensorflow-hub and
+a sufficiently recent version of tensorflow, you can run the training with a
+command like this:
+
+```bash
+python retrain.py --image_dir ~/flower_photos
+```
+
+You can replace the image_dir argument with any folder containing subfolders of
+images. The label for each image is taken from the name of the subfolder it's
+in.
+
+This produces a new model file that can be loaded and run by any TensorFlow
+program, for example the tensorflow/examples/label_image sample code.
+
+By default this script will use the highly accurate, but comparatively large and
+slow Inception V3 model architecture. It's recommended that you start with this
+to validate that you have gathered good training data, but if you want to deploy
+on resource-limited platforms, you can try the `--tfhub_module` flag with a
+Mobilenet model. For more information on Mobilenet, see
+https://research.googleblog.com/2017/06/mobilenets-open-source-models-for.html
+
+For example:
+
+Run floating-point version of Mobilenet:
+
+```bash
+python retrain.py --image_dir ~/flower_photos \
+    --tfhub_module https://tfhub.dev/google/imagenet/mobilenet_v1_100_224/feature_vector/1
+```
+
+Run Mobilenet, instrumented for quantization:
+
+```bash
+python retrain.py --image_dir ~/flower_photos/ \
+    --tfhub_module https://tfhub.dev/google/imagenet/mobilenet_v1_100_224/quantops/feature_vector/1
+```
+
+These instrumented models can be converted to fully quantized mobile models via
+TensorFlow Lite.
+
+There are different Mobilenet models to choose from, with a variety of file
+size and latency options.
+  - The first number can be '100', '075', '050', or '025' to control the number
+    of neurons (activations of hidden layers); the number of weights (and hence
+    to some extent the file size and speed) shrinks with the square of that
+    fraction.
+  - The second number is the input image size. You can choose '224', '192',
+    '160', or '128', with smaller sizes giving faster speeds.
+
+To use with TensorBoard:
+
+By default, this script logs summaries to the Model/retrain_logs directory
+(relative to the current working directory).
+
+Visualize the summaries with this command:
+
+tensorboard --logdir Model/retrain_logs
+
+To use with Tensorflow Serving, run this tool with --saved_model_dir set
+to some increasingly numbered export location under the model base path, e.g.:
+
+```bash
+python retrain.py (... other args as before ...) \
+    --saved_model_dir=/tmp/saved_models/$(date +%s)/
+tensorflow_model_server --port=9000 --model_name=my_image_classifier \
+    --model_base_path=/tmp/saved_models/
+```
+"""
+# pylint: enable=line-too-long
+
 from __future__ import absolute_import
 from __future__ import division
 from __future__ import print_function
@ -1070,13 +1169,13 @@ if __name__ == '__main__':
  parser.add_argument(
      '--image_dir',
      type=str,
-      default='../../Images/TrainingImages',
+      default='Images/TrainingImages',
      help='Path to folders of labeled images.'
  )
  parser.add_argument(
      '--output_graph',
      type=str,
-      default='../../Model/retrained_graph.pb',
+      default='Model/output_graph.pb',
      help='Where to save the trained graph.'
  )
  parser.add_argument(
@ -1097,13 +1196,13 @@ if __name__ == '__main__':
  parser.add_argument(
      '--output_labels',
      type=str,
-      default='../../Model/retrained_labels.txt',
+      default='Model/output_labels.txt',
      help='Where to save the trained graph\'s labels.'
  )
  parser.add_argument(
      '--summaries_dir',
      type=str,
-      default='/retrain_logs',
+      default='Model/retrain_logs',
      help='Where to save summary logs for TensorBoard.'
  )
  parser.add_argument(
@ -1177,7 +1276,7 @@ if __name__ == '__main__':
  parser.add_argument(
      '--bottleneck_dir',
      type=str,
-      default='/tmp/bottleneck',
+      default='Model/bottleneck',
      help='Path to cache bottleneck layer values as files.'
  )
  parser.add_argument(
@ -1235,7 +1334,7 @@ if __name__ == '__main__':
  parser.add_argument(
      '--saved_model_dir',
      type=str,
-      default='../../Model',
+      default='',
      help='Where to save the exported graph.')
  parser.add_argument(
      '--logging_verbosity',
--- a/Model/retrained_graph.pb
+++ b/Model/retrained_graph.pb
--- a/Model/retrained_labels.txt
+++ b/Model/retrained_labels.txt
@ -1,4 +0,0 @@
-glass
-metal
-paper
-plastic
--- a/Model/saved_model.pb
+++ b/Model/saved_model.pb