vtongcoder
diff --git a/‎example-basic/src/example-basic.cpp
Lines changed: 1 addition & 1 deletion b/‎example-basic/src/example-basic.cpp
Lines changed: 1 addition & 1 deletion
diff --git a/‎example-inception3/src/example-inception3.cpp
Lines changed: 91 additions & 176 deletions b/‎example-inception3/src/example-inception3.cpp
Lines changed: 91 additions & 176 deletions
@@ -18,7 +18,7 @@ class ofApp : public ofBaseApp{
 public:
 
     // main interface to everything tensorflow
-    ofxMSATensorFlow    msa_tf;
+    msa::tf::ofxMSATensorFlow    msa_tf;
 
     // input tensors
     tensorflow::Tensor a, b;
 
@@ -1,8 +1,7 @@
 /*
- * Image recognition using Google's Inception network
+ * Image recognition using Google's Inception v3 network
  * based on https://www.tensorflow.org/versions/master/tutorials/image_recognition/index.html
  *
- *
  * Uses pre-trained model https://storage.googleapis.com/download.tensorflow.org/models/inception_dec_2015.zip
  *
  * openFrameworks code loads and processes pre-trained model (i.e. makes calculations/predictions)
@@ -15,142 +14,38 @@
 #include "ofxMSATensorFlow.h"
 
 
-// input image dimensions dictated by trained model
-#define kInputWidth     299
-#define kInputHeight    299
-#define kInputSize      (kInputWidth * kInputHeight)
-
-
-// we need to normalize the images before feeding into the network
-// from each pixel we subtract the mean and divide by variance
-// this is also dictated by the trained model
-#define kInputMean      (128.0f/255.0f)
-#define kInputStd       (128.0f/255.0f)
-
-// model & labels files to load
-#define kModelPath      "models/tensorflow_inception_graph.pb"
-#define kLabelsPath     "models/imagenet_comp_graph_label_strings.txt"
-
-
-// every node in the network has a name
-// when passing in data to the network, or reading data back, we need to refer to the node by name
-// i.e. 'pass this data to node A', or 'read data back from node X'
-// these node names are specific to the architecture of the model
-#define kInputLayer     "Mul"
-#define kOutputLayer    "softmax"
-
-
-
 //--------------------------------------------------------------
 // ofImage::load() (ie. Freeimage load) doesn't work with TensorFlow! (See README.md)
 // so I have to resort to this awful trick of loading raw image data 299x299 RGB
-static void loadImageRaw(string path, ofImage &img) {
+static void loadImageRaw(string path, ofImage &img, int w, int h) {
     ofFile file(path);
-    img.setFromPixels((unsigned char*)file.readToBuffer().getData(), kInputWidth, kInputHeight, OF_IMAGE_COLOR);
-}
-
-
-
-//--------------------------------------------------------------
-// Takes a file name, and loads a list of labels from it, one per line, and
-// returns a vector of the strings. It pads with empty strings so the length
-// of the result is a multiple of 16, because our model expects that.
-static bool ReadLabelsFile(string file_name, std::vector<string>* result) {
-    std::ifstream file(file_name);
-    if (!file) {
-        ofLogError() <<"ReadLabelsFile: " << file_name << " not found.";
-        return false;
-    }
-
-    result->clear();
-    string line;
-    while (std::getline(file, line)) {
-        result->push_back(line);
-    }
-    const int padding = 16;
-    while (result->size() % padding) {
-        result->emplace_back();
-    }
-    return true;
+    img.setFromPixels((unsigned char*)file.readToBuffer().getData(), w, h, OF_IMAGE_COLOR);
 }
 
 
 
-class ofApp : public ofBaseApp{
+class ofApp : public ofBaseApp {
 public:
 
-    // main interface to everything tensorflow
-    ofxMSATensorFlow    msa_tf;
-
-    // Tensor to hold input image which is fed into the network
-    tensorflow::Tensor image_tensor;
-
-    // vector of Tensors to hold data coming back from the network
-    // (it's a vector of Tensors, because that's how the API works)
-    vector<tensorflow::Tensor> output_tensors;
+    // classifies pixels
+    // check the src of this class (ofxMSATFImageClassifier) to see how to do more generic stuff with ofxMSATensorFlow
+    msa::tf::ImageClassifier classifier;
 
     // for webcam input
     shared_ptr<ofVideoGrabber> video_grabber;
 
-    // contains input image to classify
-    ofImage input_image;
-
-    // normalized float version of input image
-    // keeping texture separate so it's not unnessecarily updated when it isn't needed
-    ofFloatPixels processed_pix;
-    ofTexture processed_tex;
-
-    // contains all labels
-    vector<string> labels;
-
     // folder of images to classify
     ofDirectory image_dir;
 
-    // contains classification information from last classification attempt
-    vector<int> top_label_indices;
-    vector<float> top_scores;
-
-    //---------------------------------------------------------
-    // Load pixels into the network, get the results
-    void classify(ofPixels &pix) {
-        // convert from unsigned char pix to float pix
-        processed_pix = pix;
-
-        // need to resize image to specific dimensions the model is expecting
-        processed_pix.resize(kInputWidth, kInputHeight);
-
-        // pixelwise normalize image by subtracting the mean and dividing by variance (across entire dataset)
-        // I could do this without iterating over the pixels, by setting up a TensorFlow Graph, but I can't be bothered, this is less code
-        float* pix_data = processed_pix.getData();
-        if(!pix_data) {
-            ofLogError() << "Could not classify. pixel data is NULL";
-            return;
-        }
-        for(int i=0; i<kInputSize*3; i++) pix_data[i] = (pix_data[i] - kInputMean) / kInputStd;
-
-        //  make sure opengl texture is updated with new pixel info (needed for correct rendering)
-        processed_tex.loadData(processed_pix);
-
-        // copy data from image into tensorflow's Tensor class
-        ofxMSATensorFlow::pixelsToTensor(processed_pix, image_tensor);
-
-        // feed the data into the network, and request output
-        // output_tensors don't need to be initialized or allocated. they will be filled once the network runs
-        if( !msa_tf.run({ {kInputLayer, image_tensor } }, { kOutputLayer }, {}, &output_tensors) ) {
-            ofLogError() << "Error during running. Check console for details." << endl;
-            return;
-        }
-
-        // the output from the network above is an array of probabilities for every single label
-        // i.e. thousands of probabilities, we only want to the top few
-        ofxMSATensorFlow::getTopScores(output_tensors[0], 6, top_label_indices, top_scores);
-    }
-
+    // top scoring classes
+    vector<int> top_label_indices;  // contains top n label indices for input image
+    vector<float> top_class_probs;  // contains top n probabilities for current input image
 
 
     //--------------------------------------------------------------
     void loadNextImage() {
         static int file_index = 0;
+        ofImage img;
 
         // System load dialog doesn't work with tensorflow :(
         //auto o = ofSystemLoadDialog("Select image");
@@ -160,35 +55,48 @@ class ofApp : public ofBaseApp{
         //img.load("images/fanboy.jpg");
 
         // resorting to awful raw data file load hack!
-        loadImageRaw(image_dir.getPath(file_index), input_image);
-        classify(input_image.getPixels());
+        loadImageRaw(image_dir.getPath(file_index), img, 299, 299);
+
+        classify(img.getPixels());
         file_index = (file_index+1) % image_dir.getFiles().size();
     }
 
 
+    //--------------------------------------------------------------
+    void classify(const ofPixels& pix) {
+        // classify pixels
+        classifier.classify(pix);
+
+        msa::tf::getTopScores(classifier.getOutputTensors()[0], 6, top_label_indices, top_class_probs);
+    }
+
     //--------------------------------------------------------------
     void setup(){
         ofLogNotice() << "Initializing... ";
         ofBackground(0);
         ofSetVerticalSync(true);
-        ofSetFrameRate(60);
+        //        ofSetFrameRate(60);
+
+        // initialize the image classifier, lots of params to setup
+        // these settings are specific to the model
+        msa::tf::ImageClassifier::Settings settings;
+        settings.image_dims = { 299, 299, 3 };
+        settings.itensor_dims = { 1, 299, 299, 3 };
+        settings.model_path = "models/tensorflow_inception_graph.pb";
+        settings.labels_path = "models/imagenet_comp_graph_label_strings.txt";
+        settings.input_layer_name = "Mul";
+        settings.output_layer_name = "softmax";
+        settings.dropout_layer_name = "";
+        settings.varconst_layer_suffix = "_VARHACK";
+        settings.norm_mean = 128.0f/255.0f;
+        settings.norm_stddev = 128.0f/255.0f;
+
+        // initialize classifier with these settings
+        classifier.setup(settings);
 
         // get a list of all images in the 'images' folder
         image_dir.listDir("images");
 
-        // Initialize tensorflow session, return if error
-        if( !msa_tf.setup() ) return;
-
-        // Load graph (i.e. trained model) add to session, return if error
-        if( !msa_tf.loadGraph(kModelPath) ) return;
-
-        // load text file containing labels (i.e. associating classification index with human readable text)
-        if( !ReadLabelsFile(ofToDataPath(kLabelsPath), &labels) ) return;
-
-        // initialize input tensor dimensions
-        // (not sure what the best way to do this was as there isn't an 'init' method, just a constructor)
-        image_tensor = tensorflow::Tensor(tensorflow::DT_FLOAT, tensorflow::TensorShape({ 1, kInputHeight, kInputWidth, 3 }));
-
         // load first image to classify
         loadNextImage();
 
@@ -197,66 +105,69 @@ class ofApp : public ofBaseApp{
 
 
     //--------------------------------------------------------------
-    void update(){
-
+    void update() {
         // if video_grabber active,
         if(video_grabber) {
             // grab frame
             video_grabber->update();
 
             if(video_grabber->isFrameNew()) {
-
-                // update input_image so it's drawn in the right place
-                input_image.setFromPixels(video_grabber->getPixels());
-
                 // send to classification if keypressed
-                if(ofGetKeyPressed(' ')) classify(input_image.getPixels());
+                if(ofGetKeyPressed(' '))
+                    classify(video_grabber->getPixels());
             }
         }
     }
 
+
     //--------------------------------------------------------------
-    void draw(){
-        // draw input image if it's available
-        float x = 0;
-        if(input_image.isAllocated()) {
-            input_image.draw(x, 0);
-            x += input_image.getWidth();
-        }
+    void draw() {
+        if(classifier.isReady()) {
+            ofSetColor(255);
 
-        // draw processed image if it's available
-        if(processed_tex.isAllocated()) {
-            processed_tex.draw(x, 0);
-            x += processed_tex.getWidth();
-        }
+            // if video grabber active, draw in bottom left corner
+            if(video_grabber) video_grabber->draw(0, ofGetHeight() - 240, 320, 240);
 
-        x += 20;
-        float w = ofGetWidth() - 400 - x;
-        float y = 40;
-        float bar_height = 35;
 
-        // iterate top scores and draw them
-        for(int i=0; i<top_scores.size(); i++) {
-            int label_index = top_label_indices[i];
-            string label = labels[label_index];
-            float p = top_scores[i];    // the score (i.e. probability, 0...1)
+            float x = 0;
 
-            // draw full bar
-            ofSetColor(ofLerp(50.0, 255.0, p), ofLerp(100.0, 0.0, p), ofLerp(150.0, 0.0, p));
-            ofDrawRectangle(x, y, w * p, bar_height);
-            ofSetColor(40);
+            // draw input image
+            classifier.getInputImage().draw(x, 0);
+            x += classifier.getInputImage().getWidth();
 
-            // draw outline
-            ofNoFill();
-            ofDrawRectangle(x, y, w, bar_height);
-            ofFill();
+            // draw processed image
+            classifier.getProcessedImage().draw(x, 0);
+            x += classifier.getProcessedImage().getWidth();
 
-            // draw text
-            ofSetColor(255);
-            ofDrawBitmapString(label + " (" + ofToString(label_index) + "): " + ofToString(p,4), x + w + 10, y + 20);
-            y += bar_height + 5;
-        }
+            x += 20;
+
+            float w = ofGetWidth() - 400 - x;
+            float y = 40;
+            float bar_height = 35;
+
+
+            // iterate top scores and draw them
+            for(int i=0; i<top_class_probs.size(); i++) {
+                int label_index = top_label_indices[i];
+                string label = classifier.getLabels()[label_index];
+                float p = top_class_probs[i];    // the score (i.e. probability, 0...1)
 
+                // draw full bar
+                ofSetColor(ofLerp(50.0, 255.0, p), ofLerp(100.0, 0.0, p), ofLerp(150.0, 0.0, p));
+                ofDrawRectangle(x, y, w * p, bar_height);
+                ofSetColor(40);
+
+                // draw outline
+                ofNoFill();
+                ofDrawRectangle(x, y, w, bar_height);
+                ofFill();
+
+                // draw text
+                ofSetColor(255);
+                ofDrawBitmapString(label + " (" + ofToString(label_index) + "): " + ofToString(p,4), x + w + 10, y + 20);
+                y += bar_height + 5;
+            }
+        }
 
         ofSetColor(255);
         ofDrawBitmapString(ofToString(ofGetFrameRate()), ofGetWidth() - 100, 30);
@@ -265,7 +176,7 @@ class ofApp : public ofBaseApp{
         str_inst << "'l' to load image\n";
         str_inst << "or drag an image (must be raw, 299x299) onto the window\n";
         str_inst << "'v' to toggle video input";
-        ofDrawBitmapString(str_inst.str(), 15, input_image.getHeight() + 30);
+        ofDrawBitmapString(str_inst.str(), 15, classifier.getHeight() + 30);
     }
 
 
@@ -291,14 +202,18 @@ class ofApp : public ofBaseApp{
     void dragEvent(ofDragInfo dragInfo){
         if(dragInfo.files.empty()) return;
 
+        ofImage img;
+
         string filePath = dragInfo.files[0];
         //img.load(filePath);  // FreeImage doesn't work :(
-        loadImageRaw(filePath, input_image);
-        classify(input_image.getPixels());
+        loadImageRaw(filePath, img, 299, 299);
+        classify(img.getPixels());
     }
 
 };
 
+
+
 //========================================================================
 int main( ){
     ofSetupOpenGL(1200, 800, OF_WINDOW);			// <-------- setup the GL context