Add script for classifying images, update gitignore.

2019-05-06 02:58:26 +02:00 · 2019-05-06 02:58:26 +02:00 · 0713f42692
commit 0713f42692
parent dfa0d87971
57 changed files with 290 additions and 14 deletions
--- a/.gitignore
+++ b/.gitignore
@ -1,4 +1,8 @@
-.vscode/*
+.vscode/
-*/__pycache__/*
+*/__pycache__/
 *tex
-Images/TrainingImages/*
+Images/TrainingImages/
 Model/bottleneck/
 Model/retrain_logs/
 Model/variables/
 Model/*.pb_log/
--- a/Images/TestImages/glass1.jpg
+++ b/Images/TestImages/glass1.jpg
--- a/Images/TestImages/glass100.jpg
+++ b/Images/TestImages/glass100.jpg
--- a/Images/TestImages/glass110.jpg
+++ b/Images/TestImages/glass110.jpg
--- a/Images/TestImages/glass113.jpg
+++ b/Images/TestImages/glass113.jpg
--- a/Images/TestImages/glass116.jpg
+++ b/Images/TestImages/glass116.jpg
--- a/Images/TestImages/glass122.jpg
+++ b/Images/TestImages/glass122.jpg
--- a/Images/TestImages/glass126.jpg
+++ b/Images/TestImages/glass126.jpg
--- a/Images/TestImages/glass156.jpg
+++ b/Images/TestImages/glass156.jpg
--- a/Images/TestImages/glass42.jpg
+++ b/Images/TestImages/glass42.jpg
--- a/Images/TestImages/glass43.jpg
+++ b/Images/TestImages/glass43.jpg
--- a/Images/TestImages/glass44.jpg
+++ b/Images/TestImages/glass44.jpg
--- a/Images/TestImages/glass46.jpg
+++ b/Images/TestImages/glass46.jpg
--- a/Images/TestImages/glass55.jpg
+++ b/Images/TestImages/glass55.jpg
--- a/Images/TestImages/glass59.jpg
+++ b/Images/TestImages/glass59.jpg
--- a/Images/TestImages/metal112.jpg
+++ b/Images/TestImages/metal112.jpg
--- a/Images/TestImages/metal20.jpg
+++ b/Images/TestImages/metal20.jpg
--- a/Images/TestImages/metal24.jpg
+++ b/Images/TestImages/metal24.jpg
--- a/Images/TestImages/metal27.jpg
+++ b/Images/TestImages/metal27.jpg
--- a/Images/TestImages/metal29.jpg
+++ b/Images/TestImages/metal29.jpg
--- a/Images/TestImages/metal31.jpg
+++ b/Images/TestImages/metal31.jpg
--- a/Images/TestImages/metal33.jpg
+++ b/Images/TestImages/metal33.jpg
--- a/Images/TestImages/metal50.jpg
+++ b/Images/TestImages/metal50.jpg
--- a/Images/TestImages/metal54.jpg
+++ b/Images/TestImages/metal54.jpg
--- a/Images/TestImages/metal86.jpg
+++ b/Images/TestImages/metal86.jpg
--- a/Images/TestImages/metal89.jpg
+++ b/Images/TestImages/metal89.jpg
--- a/Images/TestImages/metal94.jpg
+++ b/Images/TestImages/metal94.jpg
--- a/Images/TestImages/paper102.jpg
+++ b/Images/TestImages/paper102.jpg
--- a/Images/TestImages/paper111.jpg
+++ b/Images/TestImages/paper111.jpg
--- a/Images/TestImages/paper113.jpg
+++ b/Images/TestImages/paper113.jpg
--- a/Images/TestImages/paper118.jpg
+++ b/Images/TestImages/paper118.jpg
--- a/Images/TestImages/paper16.jpg
+++ b/Images/TestImages/paper16.jpg
--- a/Images/TestImages/paper20.jpg
+++ b/Images/TestImages/paper20.jpg
--- a/Images/TestImages/paper35.jpg
+++ b/Images/TestImages/paper35.jpg
--- a/Images/TestImages/paper46.jpg
+++ b/Images/TestImages/paper46.jpg
--- a/Images/TestImages/paper52.jpg
+++ b/Images/TestImages/paper52.jpg
--- a/Images/TestImages/paper56.jpg
+++ b/Images/TestImages/paper56.jpg
--- a/Images/TestImages/paper71.jpg
+++ b/Images/TestImages/paper71.jpg
--- a/Images/TestImages/paper72.jpg
+++ b/Images/TestImages/paper72.jpg
--- a/Images/TestImages/paper76.jpg
+++ b/Images/TestImages/paper76.jpg
--- a/Images/TestImages/paper94.jpg
+++ b/Images/TestImages/paper94.jpg
--- a/Images/TestImages/plastic1.jpg
+++ b/Images/TestImages/plastic1.jpg
--- a/Images/TestImages/plastic20.jpg
+++ b/Images/TestImages/plastic20.jpg
--- a/Images/TestImages/plastic32.jpg
+++ b/Images/TestImages/plastic32.jpg
--- a/Images/TestImages/plastic57.jpg
+++ b/Images/TestImages/plastic57.jpg
--- a/Images/TestImages/plastic73.jpg
+++ b/Images/TestImages/plastic73.jpg
--- a/Images/TestImages/plastic77.jpg
+++ b/Images/TestImages/plastic77.jpg
--- a/Images/TestImages/plastic78.jpg
+++ b/Images/TestImages/plastic78.jpg
--- a/Images/TestImages/plastic85.jpg
+++ b/Images/TestImages/plastic85.jpg
--- a/Images/TestImages/plastic91.jpg
+++ b/Images/TestImages/plastic91.jpg
--- a/Images/TestImages/plastic98.jpg
+++ b/Images/TestImages/plastic98.jpg
--- a/Logic/TrashRecognition/ImageClassification.py
+++ b/Logic/TrashRecognition/ImageClassification.py
@ -1 +1,156 @@
-import tensorflow as tf
+# Copyright 2017 The TensorFlow Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 # ==============================================================================
 from __future__ import absolute_import
 from __future__ import division
 from __future__ import print_function
 import argparse
 import os
 import numpy as np
 import tensorflow as tf
 def load_graph(model_file):
  graph = tf.Graph()
  graph_def = tf.GraphDef()
  with open(model_file, "rb") as f:
    graph_def.ParseFromString(f.read())
  with graph.as_default():
    tf.import_graph_def(graph_def)
  return graph
 def read_tensor_from_image_file(file_name,
                                input_height=299,
                                input_width=299,
                                input_mean=0,
                                input_std=255):
  input_name = "file_reader"
  output_name = "normalized"
  file_reader = tf.read_file(file_name, input_name)
  if file_name.endswith(".png"):
    image_reader = tf.image.decode_png(
        file_reader, channels=3, name="png_reader")
  elif file_name.endswith(".gif"):
    image_reader = tf.squeeze(
        tf.image.decode_gif(file_reader, name="gif_reader"))
  elif file_name.endswith(".bmp"):
    image_reader = tf.image.decode_bmp(file_reader, name="bmp_reader")
  else:
    image_reader = tf.image.decode_jpeg(
        file_reader, channels=3, name="jpeg_reader")
  float_caster = tf.cast(image_reader, tf.float32)
  dims_expander = tf.expand_dims(float_caster, 0)
  resized = tf.image.resize_bilinear(dims_expander, [input_height, input_width])
  normalized = tf.divide(tf.subtract(resized, [input_mean]), [input_std])
  sess = tf.Session()
  result = sess.run(normalized)
  return result
 def load_labels(label_file):
  label = []
  proto_as_ascii_lines = tf.gfile.GFile(label_file).readlines()
  for l in proto_as_ascii_lines:
    label.append(l.rstrip())
  return label
 if __name__ == "__main__":
  model_file = "Model/retrained_graph.pb"
  label_file = "Model/retrained_labels.txt"
  input_height = 299
  input_width = 299
  input_mean = 128
  input_std = 128
  input_layer = "input"
  output_layer = "InceptionV3/Predictions/Reshape_1"
  parser = argparse.ArgumentParser()
  parser.add_argument("--graph",
   default="Model/retrained_graph.pb",
   help="graph/model to be executed")
  parser.add_argument("--labels",
   default="Model/retrained_labels.txt",
   help="name of file containing labels")
  parser.add_argument("--input_height", type=int, help="input height")
  parser.add_argument("--input_width", type=int, help="input width")
  parser.add_argument("--input_mean", type=int, help="input mean")
  parser.add_argument("--input_std", type=int, help="input std")
  parser.add_argument("--input_layer",
   default="Placeholder",
    help="name of input layer")
  parser.add_argument("--output_layer",
   default="final_result",
   help="name of output layer")
  args = parser.parse_args()
  if args.graph:
    model_file = args.graph
  if args.labels:
    label_file = args.labels
  if args.input_height:
    input_height = args.input_height
  if args.input_width:
    input_width = args.input_width
  if args.input_mean:
    input_mean = args.input_mean
  if args.input_std:
    input_std = args.input_std
  if args.input_layer:
    input_layer = args.input_layer
  if args.output_layer:
    output_layer = args.output_layer
  graph = load_graph(model_file)
  for filename in os.listdir('Images/TestImages'):
    t = read_tensor_from_image_file(
      f'Images/TestImages/{filename}',
      input_height=input_height,
      input_width=input_width,
      input_mean=input_mean,
      input_std=input_std)
    input_name = "import/" + input_layer
    output_name = "import/" + output_layer
    input_operation = graph.get_operation_by_name(input_name)
    output_operation = graph.get_operation_by_name(output_name)
    with tf.Session(graph=graph) as sess:
      results = sess.run(output_operation.outputs[0], {
          input_operation.outputs[0]: t
      })
    results = np.squeeze(results)
    top_k = results.argsort()[-5:][::-1]
    labels = load_labels(label_file)
    print(f'{filename}: {labels[top_k[0]]} with {results[top_k[0]] * 100}% certainity')
    # for i in top_k:
    #   print(labels[i], results[i])
--- a/Logic/TrashRecognition/LoadGraphToTB.py
+++ b/Logic/TrashRecognition/LoadGraphToTB.py
@ -0,0 +1,22 @@
 import tensorflow as tf
 from tensorflow.python.platform import gfile
 import os
 def load_pb_to_log(filename):
    with tf.Session() as sess:
        with gfile.FastGFile(filename, 'rb') as f:
            graph_def = tf.GraphDef()
            graph_def.ParseFromString(f.read())
            g_in = tf.import_graph_def(graph_def)
    LOGDIR = f'{filename}_log'
    train_writer = tf.summary.FileWriter(LOGDIR)
    train_writer.add_graph(sess.graph)
 def main():
    for filename in os.listdir('Model'):
        fname, fext = os.path.splitext(filename)
        if fext == '.pb':
            load_pb_to_log(f'Model/{filename}')
 if __name__ == "__main__":
    main()
--- a/Logic/TrashRecognition/Retrain.py
+++ b/Logic/TrashRecognition/Retrain.py
@ -15,6 +15,105 @@
 # NOTICE: This work was derived from tensorflow/examples/image_retraining
 # and modified to use TensorFlow Hub modules.
 # pylint: disable=line-too-long
 r"""Simple transfer learning with image modules from TensorFlow Hub.
 This example shows how to train an image classifier based on any
 TensorFlow Hub module that computes image feature vectors. By default,
 it uses the feature vectors computed by Inception V3 trained on ImageNet.
 For more options, search https://tfhub.dev for image feature vector modules.
 The top layer receives as input a 2048-dimensional vector (assuming
 Inception V3) for each image. We train a softmax layer on top of this
 representation. If the softmax layer contains N labels, this corresponds
 to learning N + 2048*N model parameters for the biases and weights.
 Here's an example, which assumes you have a folder containing class-named
 subfolders, each full of images for each label. The example folder flower_photos
 should have a structure like this:
 ~/flower_photos/daisy/photo1.jpg
 ~/flower_photos/daisy/photo2.jpg
 ...
 ~/flower_photos/rose/anotherphoto77.jpg
 ...
 ~/flower_photos/sunflower/somepicture.jpg
 The subfolder names are important, since they define what label is applied to
 each image, but the filenames themselves don't matter. (For a working example,
 download http://download.tensorflow.org/example_images/flower_photos.tgz
 and run  tar xzf flower_photos.tgz  to unpack it.)
 Once your images are prepared, and you have pip-installed tensorflow-hub and
 a sufficiently recent version of tensorflow, you can run the training with a
 command like this:
 ```bash
 python retrain.py --image_dir ~/flower_photos
 ```
 You can replace the image_dir argument with any folder containing subfolders of
 images. The label for each image is taken from the name of the subfolder it's
 in.
 This produces a new model file that can be loaded and run by any TensorFlow
 program, for example the tensorflow/examples/label_image sample code.
 By default this script will use the highly accurate, but comparatively large and
 slow Inception V3 model architecture. It's recommended that you start with this
 to validate that you have gathered good training data, but if you want to deploy
 on resource-limited platforms, you can try the `--tfhub_module` flag with a
 Mobilenet model. For more information on Mobilenet, see
 https://research.googleblog.com/2017/06/mobilenets-open-source-models-for.html
 For example:
 Run floating-point version of Mobilenet:
 ```bash
 python retrain.py --image_dir ~/flower_photos \
    --tfhub_module https://tfhub.dev/google/imagenet/mobilenet_v1_100_224/feature_vector/1
 ```
 Run Mobilenet, instrumented for quantization:
 ```bash
 python retrain.py --image_dir ~/flower_photos/ \
    --tfhub_module https://tfhub.dev/google/imagenet/mobilenet_v1_100_224/quantops/feature_vector/1
 ```
 These instrumented models can be converted to fully quantized mobile models via
 TensorFlow Lite.
 There are different Mobilenet models to choose from, with a variety of file
 size and latency options.
  - The first number can be '100', '075', '050', or '025' to control the number
    of neurons (activations of hidden layers); the number of weights (and hence
    to some extent the file size and speed) shrinks with the square of that
    fraction.
  - The second number is the input image size. You can choose '224', '192',
    '160', or '128', with smaller sizes giving faster speeds.
 To use with TensorBoard:
 By default, this script will log summaries to /tmp/retrain_logs directory
 Visualize the summaries with this command:
 tensorboard --logdir /tmp/retrain_logs
 To use with Tensorflow Serving, run this tool with --saved_model_dir set
 to some increasingly numbered export location under the model base path, e.g.:
 ```bash
 python retrain.py (... other args as before ...) \
    --saved_model_dir=/tmp/saved_models/$(date +%s)/
 tensorflow_model_server --port=9000 --model_name=my_image_classifier \
    --model_base_path=/tmp/saved_models/
 ```
 """
 # pylint: enable=line-too-long
 from __future__ import absolute_import
 from __future__ import division
 from __future__ import print_function
@ -1070,13 +1169,13 @@ if __name__ == '__main__':
  parser.add_argument(
      '--image_dir',
      type=str,
-      default='../../Images/TrainingImages',
+      default='Images/TrainingImages',
      help='Path to folders of labeled images.'
  )
  parser.add_argument(
      '--output_graph',
      type=str,
-      default='../../Model/retrained_graph.pb',
+      default='Model/output_graph.pb',
      help='Where to save the trained graph.'
  )
  parser.add_argument(
@ -1097,13 +1196,13 @@ if __name__ == '__main__':
  parser.add_argument(
      '--output_labels',
      type=str,
-      default='../../Model/retrained_labels.txt',
+      default='Model/output_labels.txt',
      help='Where to save the trained graph\'s labels.'
  )
  parser.add_argument(
      '--summaries_dir',
      type=str,
-      default='/retrain_logs',
+      default='Model/retrain_logs',
      help='Where to save summary logs for TensorBoard.'
  )
  parser.add_argument(
@ -1177,7 +1276,7 @@ if __name__ == '__main__':
  parser.add_argument(
      '--bottleneck_dir',
      type=str,
-      default='/tmp/bottleneck',
+      default='Model/bottleneck',
      help='Path to cache bottleneck layer values as files.'
  )
  parser.add_argument(
@ -1235,7 +1334,7 @@ if __name__ == '__main__':
  parser.add_argument(
      '--saved_model_dir',
      type=str,
-      default='../../Model',
+      default='',
      help='Where to save the exported graph.')
  parser.add_argument(
      '--logging_verbosity',
--- a/Model/retrained_graph.pb
+++ b/Model/retrained_graph.pb
--- a/Model/retrained_labels.txt
+++ b/Model/retrained_labels.txt
@ -1,4 +0,0 @@
 glass
 metal
 paper
 plastic
--- a/Model/saved_model.pb
+++ b/Model/saved_model.pb