Adding grayscale classification

carlyrichmond · carlyrichmond · commit 12860c44c0bb · 2025-06-27T12:04:44.000+01:00
diff --git a/README.md b/README.md
@@ -79,6 +79,7 @@ nvm use v22.1.0
 
 node scripts/classify-images.js
 node scripts/custom-model.js
+node scripts/grayscale-custom-model.js
 node scripts/transfer-learning.js
 ```
 
@@ -128,5 +129,12 @@ Thanks go to the fantastic bakers out there making hyper-realistic cakes that in
 5. https://www.thesugardreams.net
 6. https://juliemcallistercakes.com
 7. https://www.thesweetstopofrva.com
+8. https://apriljulian.com/portfolio
+9. https://cakeyall.com/
+10. https://www.layerscakestudio.com/
+11. https://www.apinchofspirit.com/gallery
+12. https://www.mycakebuds.com
+13. https://mannandcobakeshop.com/
+14. https://www.thesculptedslice.com/
 
 Thanks also to [Unsplash](https://unsplash.com/) and their amazing contributors who allowed me to find non-cake images through the [JavaScript wrapper unsplash-js](https://www.npmjs.com/package/unsplash-js) of the [Unsplash API](https://unsplash.com/documentation). 
diff --git a/cake-game/src/components/classifier-table-row/ClassifierTableRow.jsx b/cake-game/src/components/classifier-table-row/ClassifierTableRow.jsx
@@ -39,6 +39,7 @@ function ClassifierTableRow(props) {
         <th className="classification">{ formatClassificationCollections(props.result.models?.coco_ssd_predictions, 'class') }</th>
         <th className="classification">{ formatClassificationString(props.result.models?.my_transfer_model_classifier?.category) }</th>
         <th className="classification">{ formatClassificationString(props.result.models?.my_model_classifier.category) }</th>
+        <th className="classification">{ formatClassificationString(props.result.models?.my_grayscale_model_classifier?.category) }</th>
       </tr>
     </>
   );
diff --git a/cake-game/src/functions/game_results.js b/cake-game/src/functions/game_results.js
@@ -17,6 +17,8 @@ export async function handler(event, context) {
       return document._source;
     });
 
+    // console.log(`RESULTS: ${results}`)
+
     return generateResponse(200, results);
   } catch (e) {
     console.log(e);
diff --git a/cake-game/src/routes/end/End.jsx b/cake-game/src/routes/end/End.jsx
@@ -73,6 +73,7 @@ function End() {
                 <th>COCO-SSD</th>
                 <th>MobileNet Transfer Classifier</th>
                 <th>Carly Model</th>
+                <th>Carly Model (Grayscale)</th>
               </tr>
             </thead>
             <tbody>
diff --git a/model-classification-app/scripts/cake-image-urls.json b/model-classification-app/scripts/cake-image-urls.json
diff --git a/model-classification-app/scripts/cake-sites.json b/model-classification-app/scripts/cake-sites.json
@@ -34,5 +34,41 @@
     {
         "url": "https://www.thesweetstopofrva.com/weddingcakes",
         "category": "cake"  
+    },
+    {
+        "url": "https://apriljulian.com/portfolio",
+        "category": "cake"  
+    },
+    {
+        "url": "https://cakeyall.com/pages/info",
+        "category": "cake"  
+    },
+    {
+        "url": "https://www.layerscakestudio.com/",
+        "category": "cake"  
+    },
+    {
+        "url": "https://www.apinchofspirit.com/gallery",
+        "category": "cake"  
+    },
+    {
+        "url": "https://www.mycakebuds.com/products",
+        "category": "cake"  
+    },
+    {
+        "url": "https://mannandcobakeshop.com/pages/custom-cake",
+        "category": "cake"  
+    },
+    {
+        "url": "https://www.thesculptedslice.com/gallery-home/celebration-cakes",
+        "category": "cake"  
+    },
+    {
+        "url": "https://www.thesculptedslice.com/gallery-home/sculpted-cakes",
+        "category": "cake"  
+    },
+    {
+        "url": "https://www.thesculptedslice.com/gallery-home/wedding-cakes",
+        "category": "cake"  
     }
 ]
diff --git a/model-classification-app/scripts/classify-images.js b/model-classification-app/scripts/classify-images.js
@@ -40,9 +40,9 @@ async function run() {
   // Reset index (uncomment if regenerating)
   //await clearIndex();
 
-  /*await getCakeImages();
-  const cakeImageUrls = loadCakeImageUrls();
-  await classifyImages('cake', cakeImageUrls);*/
+  //await getCakeImages();
+  //const cakeImageUrls = loadCakeImageUrls();
+  //await classifyImages('cake', cakeImageUrls);
 
   const objectImageUrls = await getUnsplashImageUrls();
   await classifyImages("not cake", objectImageUrls);
@@ -65,7 +65,7 @@ async function getCakeImages() {
     try {
       await page.goto(site.url);
       const currentPageImages = await page
-        .locator("img")
+        .getByRole("img")
         .evaluateAll((images) => {
           return images
             .map((image) => {
diff --git a/model-classification-app/scripts/elasticsearch-util.js b/model-classification-app/scripts/elasticsearch-util.js
@@ -85,6 +85,29 @@ async function updateDocumentWithClassification(documentId, category, prediction
   }
 }
 
+/**
+ * Sets `my_grayscale_model_classifier` ({ category, predictions }) on the document with
+ * id `documentId`. The update response is logged; a failed update is logged, not rethrown.
+ * @returns {Promise<void>} resolves after the response or the error has been logged
+ */
+async function updateDocumentWithGrayscaleClassification(documentId, category, predictions) {
+  const classification = { category: category, predictions: predictions };
+  try {
+    const updateRequest = {
+      index: index,
+      id: documentId,
+      script: {
+        lang: 'painless',
+        source: `ctx._source.my_grayscale_model_classifier = params.classification`,
+        params: { classification }
+      }
+    };
+    console.log(await esClient.update(updateRequest));
+  } catch(e) {
+    console.log(e);
+  }
+}
+
 async function updateDocumentWithTransferClassification(documentId, category, predictions) {
   const myModelClassifier = { 
     category:  category,
@@ -107,4 +130,4 @@ async function updateDocumentWithTransferClassification(documentId, category, pr
   }
 }
 
-module.exports = { esClient, clearIndex, addClassifiersToIndex, getAllImages, getFirstNImagesByCategory, updateDocumentWithClassification, updateDocumentWithTransferClassification };
+module.exports = { esClient, clearIndex, addClassifiersToIndex, getAllImages, getFirstNImagesByCategory, updateDocumentWithClassification, updateDocumentWithGrayscaleClassification, updateDocumentWithTransferClassification };
diff --git a/model-classification-app/scripts/grayscale-custom-model.js b/model-classification-app/scripts/grayscale-custom-model.js
@@ -0,0 +1,168 @@
+const tf = require("@tensorflow/tfjs-node");
+
+const {
+  getAllImages,
+  getFirstNImagesByCategory,
+  updateDocumentWithGrayscaleClassification,
+} = require("./elasticsearch-util");
+const { getGrayscaleImageTensor, getGrayscaleTensorsForImageSet, IMAGE_HEIGHT, IMAGE_WIDTH } = require("./tf-util");
+
+const CLASS_NAMES = ["cake", "not cake"]; // Order matters: model output i is reported as CLASS_NAMES[i]
+
+// Entry point: build the custom grayscale model (see run below)
+run();
+
+// Trains the grayscale model on the images requested for each class (50 per class),
+// classifies every indexed image with it and finally saves the model to ./model.
+async function run() {
+  const SAMPLES_PER_CLASS = 50;
+  const [cakeClass, notCakeClass] = CLASS_NAMES;
+
+  // Training subset: cake images first, then the unsplash images for not cake
+  const cakeTensors = await getGrayscaleTensorsForImageSet(
+    await getFirstNImagesByCategory(cakeClass, SAMPLES_PER_CLASS)
+  );
+  const notCakeTensors = await getGrayscaleTensorsForImageSet(
+    await getFirstNImagesByCategory(notCakeClass, SAMPLES_PER_CLASS)
+  );
+
+  // One-hot label rows in CLASS_NAMES order: [1, 0] = cake, [0, 1] = not cake
+  const cakeRow = [1, 0];
+  const notCakeRow = [0, 1];
+  const images = [...cakeTensors, ...notCakeTensors];
+  const labels = [
+    ...cakeTensors.map(() => cakeRow),
+    ...notCakeTensors.map(() => notCakeRow),
+  ];
+
+  // Shuffle both arrays the same way so every image keeps its label
+  tf.util.shuffleCombo(images, labels);
+  const singleImageTensor = tf.stack(images);
+  const labelsTensor = tf.tensor2d(labels);
+
+  const model = createModel();
+  await model.fit(singleImageTensor, labelsTensor, {
+    batchSize: 32, // Number of samples to work through before updating the internal model parameters
+    epochs: 10, // Number of passes through the dataset
+    shuffle: true, // Shuffle data before each pass
+  });
+
+  await classifyAllImages(model);
+  const MODEL_DIR = "./model"; // Optional saving of model
+  await model.save(`file://${MODEL_DIR}`);
+
+  // Tidy up
+  tf.dispose([singleImageTensor, labelsTensor]);
+  tf.dispose(cakeTensors);
+  tf.dispose(notCakeTensors);
+  console.log('Classification complete!');
+}
+
+/* Functional implementation */
+// Convolutional Neural Network (CNN) example
+/**
+ * Builds and compiles the Convolutional Neural Network (CNN) for grayscale images:
+ * two convolution + max pooling stages, a flatten layer, a 64 unit dense layer and
+ * a softmax output with one unit per entry of CLASS_NAMES. Returns the compiled model.
+ */
+function createModel() {
+  const layers = [
+    /* 2D convolution layer.
+     * Computer vision concept: a filter (or kernel or matrix) is applied and moves through
+     * the image by the specified strides to identify features of interest in the image.
+     * See https://www.kaggle.com/discussions/general/463431
+     */
+    tf.layers.conv2d({
+      inputShape: [IMAGE_WIDTH, IMAGE_HEIGHT, 1], // 1 = Grayscale
+      filters: 16, // dimensions of the output space
+      kernelSize: 3, // 3x3 matrix
+      activation: "relu", // f(x)=max(0,x)
+    }),
+
+    /* Max pooling reduces the dimensionality of images by reducing the number of pixels
+     * in the output from the previous convolutional layer.
+     * Used to reduce computational load going forward and reduce overfitting.
+     * See https://deeplizard.com/learn/video/ZjM_XQa5s6s
+     */
+    tf.layers.maxPooling2d({
+      poolSize: 2,
+      strides: 2,
+    }),
+
+    // Second convolution + pooling stage, with twice as many filters as the first
+    tf.layers.conv2d({
+      filters: 32,
+      kernelSize: 3,
+      activation: "relu",
+    }),
+    tf.layers.maxPooling2d({
+      poolSize: 2,
+      strides: 2,
+    }),
+
+    // Flattens the inputs to 1D, making the outputs 2D
+    tf.layers.flatten(),
+
+    /* Dense layer: each neuron receives input from all the neurons of the previous layer.
+     * Used to classify the image based on the output from the convolutional layers.
+     * See https://towardsdatascience.com/introduction-to-convolutional-neural-network-cnn-de
+     */
+    tf.layers.dense({
+      units: 64,
+      activation: "relu",
+    }),
+
+    // Output layer: softmax turns a vector of K real values into K real values that sum to 1
+    tf.layers.dense({
+      units: CLASS_NAMES.length,
+      activation: "softmax",
+    }),
+  ];
+
+  // Add the layers to a sequential model in the order listed above
+  const model = tf.sequential();
+  for (const layer of layers) {
+    model.add(layer);
+  }
+
+  model.compile({
+    optimizer: tf.train.adam(), // Stochastic Optimization method
+    loss: "binaryCrossentropy",
+    metrics: ["accuracy"],
+  });
+  return model;
+}
+
+/**
+ * Classifies every indexed image with the given model and stores the ranked
+ * predictions on its document via updateDocumentWithGrayscaleClassification.
+ * @param model - trained model; its output values are read in CLASS_NAMES order
+ */
+async function classifyAllImages(model) {
+  const imagesResponse = await getAllImages();
+  const images = imagesResponse.hits.hits.map((result) => {
+    return { id: result._id, url: result._source.image_url };
+  });
+
+  // `const` keeps the loop variable local instead of creating an implicit global
+  for (const image of images) {
+    console.log(image.url);
+    const tensor = await getGrayscaleImageTensor(image.url);
+    const batch = tensor.expandDims(); // add the leading batch dimension
+    const output = model.predict(batch);
+
+    try {
+      const predictions = Array.from(await output.data())
+        .map((probability, i) => ({ probability, className: CLASS_NAMES[i] }))
+        .sort((a, b) => b.probability - a.probability)
+        .slice(0, 2);
+
+      console.log(predictions);
+      // Awaited so the update has finished before the next image is processed
+      await updateDocumentWithGrayscaleClassification(image.id, predictions[0].className, predictions);
+    } finally {
+      // Release the image tensor, its batched copy and the model output
+      tf.dispose([tensor, batch, output]);
+    }
+  }
+}
diff --git a/model-classification-app/scripts/tf-util.js b/model-classification-app/scripts/tf-util.js
@@ -42,6 +42,16 @@ async function getTensorFromImage(imageUrl) {
   
     return tensors;
   }
+
+  // Builds one grayscale tensor per entry of `results.hits.hits`, in the order of the hits.
+  async function getGrayscaleTensorsForImageSet(results) {
+    const tensors = [];
+    // `const` scopes the loop variable; a bare `result` would become an implicit global
+    for (const result of results.hits.hits) {
+      tensors.push(await getGrayscaleImageTensor(result._source.image_url));
+    }
+    return tensors;
+  }
   
   async function getResizedImageTensor(imageUrl) {
     const decodedImage = await getTensorFromImage(imageUrl);
@@ -52,4 +62,15 @@ async function getTensorFromImage(imageUrl) {
     return resizedImage;
   }
 
-module.exports = { getResizedImageTensor, getTensorFromImage, getTensorsForImageSet, IMAGE_HEIGHT, IMAGE_WIDTH };
+  // Loads an image, resizes it to [IMAGE_WIDTH, IMAGE_HEIGHT] and returns it converted to grayscale.
+  async function getGrayscaleImageTensor(imageUrl) {
+    const decodedImage = await getTensorFromImage(imageUrl);
+    // tidy() frees the resized intermediate and keeps only the returned grayscale tensor
+    const grayscaleImage = tf.tidy(() =>
+      tf.image.rgbToGrayscale(tf.image.resizeBilinear(decodedImage, [IMAGE_WIDTH, IMAGE_HEIGHT], true))
+    );
+    decodedImage.dispose(); // the decoded source image is no longer needed once converted
+    return grayscaleImage;
+  }
+
+module.exports = { getGrayscaleImageTensor, getResizedImageTensor, getTensorFromImage, getTensorsForImageSet, getGrayscaleTensorsForImageSet, IMAGE_HEIGHT, IMAGE_WIDTH };
diff --git a/model-classification-app/scripts/unsplash-util.js b/model-classification-app/scripts/unsplash-util.js
@@ -5,7 +5,7 @@ const unsplash = createApi({
   accessKey: process.env.UNSPLASH_ACCESS_KEY
 });
 
-const queries = [ "cup", "vase", "candle", "bottle", "plate", "tray", "thimble", "flowerpot", "dog", "cat", "hat", "book", "food", "reptile", "toy", "shoe", "bag", "purse" ];
+const queries = [ "cup", "vase", "candle", "bottle", "plate", "tray", "thimble", "flowerpot", "dog", "cat", "hat", "book", "food", "reptile", "toy", "shoe", "bag", "purse", "guitars", "cars", "burgers", "cleaning products", "lizards", "football", "pineapple", "oranges", "teddy", "cheese", "game boy" ];
 
 async function getUnsplashImageUrls() {