No public description

tensorflower-gardener · tensorflower-gardener · commit 511bb82f5da0 · 2025-05-09T14:24:15.000-07:00
PiperOrigin-RevId: 756905799
diff --git a/official/projects/waste_identification_ml/Triton_TF_Cloud_Deployment/client/utils.py b/official/projects/waste_identification_ml/Triton_TF_Cloud_Deployment/client/utils.py
@@ -0,0 +1,111 @@
+# Copyright 2024 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""Utility functions for the pipeline."""
+
+from collections.abc import Mapping, Sequence
+import csv
+import os
+from typing import TypedDict
+import natsort
+
+
+class ItemDict(TypedDict):  # Shape of one entry of the category index.
+  id: int  # Category ID; also the key of this entry in the category index.
+  name: str  # Object (label) name.
+  supercategory: str  # Set to 'objects' by _categories_dictionary.
+
+
+def _read_csv_to_list(file_path: str) -> Sequence[str]:
+  """Reads the first column of a CSV file into a list of strings.
+
+  Every non-empty row contributes its first cell, in file order. No header
+  is skipped: if the file starts with a header row, its first cell is the
+  first element of the result. Blank lines are ignored instead of raising.
+
+  Args:
+      file_path: The path to the CSV file.
+
+  Returns:
+      The first-column values of the CSV file as a list of strings.
+  """
+  # newline='' lets the csv module handle line endings itself, as its
+  # documentation recommends for files passed to csv.reader.
+  with open(file_path, 'r', newline='') as csvfile:
+    # csv.reader yields [] for a blank line; indexing it would raise
+    # IndexError, so such rows are filtered out.
+    return [row[0] for row in csv.reader(csvfile) if row]
+
+
+def _categories_dictionary(objects: Sequence[str]) -> Mapping[int, ItemDict]:
+  """Builds a category index keyed by 1-based category ID.
+
+  Each name in `objects` is assigned an ID equal to its 1-based position, and
+  the returned dictionary maps that ID to an item dictionary with the keys:
+    - id: The ID of the object (same as the dictionary key).
+    - name: The name of the object.
+    - supercategory: Always the string 'objects'.
+
+  Args:
+    objects: A list of strings, where each string is the name of an object.
+
+  Returns:
+    A single dictionary mapping each ID to its item dictionary, as described
+    above. It is empty when `objects` is empty.
+  """
+  # IDs start at 1 rather than 0, so the first name gets ID 1.
+  return {
+      label_id: {'id': label_id, 'name': label, 'supercategory': 'objects'}
+      for label_id, label in enumerate(objects, start=1)
+  }
+
+
+def load_labels(
+    labels_path: str,
+) -> tuple[Sequence[str], Mapping[int, ItemDict]]:
+  """Reads label names from a CSV file and builds their category index.
+
+  Args:
+      labels_path: Path to the CSV file containing label definitions.
+
+  Returns:
+    A 2-tuple `(names, index)`: `names` is the list of label names produced by
+    `_read_csv_to_list`, and `index` is the dictionary that
+    `_categories_dictionary` builds from those names.
+  """
+  label_names = _read_csv_to_list(labels_path)
+  return label_names, _categories_dictionary(label_names)
+
+
+def files_paths(folder_path: str) -> list[str]:
+  """Lists the image files directly inside a folder, in natural sort order.
+
+  Only regular files whose lower-cased name ends with a known image extension
+  are kept; subfolders are not descended into.
+
+  Args:
+    folder_path: The path of the folder to list the image files from.
+
+  Returns:
+    The paths (`folder_path` joined with each file name) of the image files,
+    ordered by `natsort.natsorted`. Empty when the folder has no image file.
+  """
+  img_extensions = ('.jpg', '.jpeg', '.png', '.gif', '.bmp', '.tiff', '.webp')
+  # The context manager closes the directory iterator even if listing fails.
+  with os.scandir(folder_path) as entries:
+    image_files_full_path = [
+        entry.path for entry in entries
+        if entry.is_file() and entry.name.lower().endswith(img_extensions)
+    ]
+  return natsort.natsorted(image_files_full_path)
diff --git a/official/projects/waste_identification_ml/Triton_TF_Cloud_Deployment/client/utils_test.py b/official/projects/waste_identification_ml/Triton_TF_Cloud_Deployment/client/utils_test.py
@@ -0,0 +1,86 @@
+# Copyright 2024 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import os
+import tempfile
+import unittest
+from official.projects.waste_identification_ml.Triton_TF_Cloud_Deployment.client import utils
+
+
+class TestLoadLabels(unittest.TestCase):
+  """Tests for `utils.load_labels` and `utils.files_paths`."""
+
+  def _touch_all(self, folder, names):
+    """Creates an empty file in `folder` for each name in `names`."""
+    for name in names:
+      open(os.path.join(folder, name), 'a').close()
+
+  def test_load_labels(self):
+    """Every CSV row, including the 'Label' first row, becomes a label."""
+    # delete=False keeps the file on disk once the `with` block closes it, so
+    # load_labels can reopen it by path.
+    with tempfile.NamedTemporaryFile(mode='w+', delete=False) as labels_file:
+      labels_file.write('Label\nBottle\nCan\nCup\n')
+    labels_path = labels_file.name
+    # Cleanups registered here run even when an assertion below fails.
+    self.addCleanup(os.remove, labels_path)
+
+    names, index = utils.load_labels(labels_path)
+
+    self.assertEqual(names, ['Label', 'Bottle', 'Can', 'Cup'])
+    self.assertEqual(
+        index,
+        {
+            1: {'id': 1, 'name': 'Label', 'supercategory': 'objects'},
+            2: {'id': 2, 'name': 'Bottle', 'supercategory': 'objects'},
+            3: {'id': 3, 'name': 'Can', 'supercategory': 'objects'},
+            4: {'id': 4, 'name': 'Cup', 'supercategory': 'objects'},
+        },
+    )
+
+  def test_files_paths_with_images(self):
+    """Image files are returned in natural order; other files are dropped."""
+    with tempfile.TemporaryDirectory() as folder:
+      self._touch_all(
+          folder, ['img2.jpg', 'img1.png', 'doc1.txt', 'photo.gif'])
+
+      found = utils.files_paths(folder)
+
+      # 'doc1.txt' is absent and 'img1' sorts before 'img2'.
+      wanted = [
+          os.path.join(folder, name)
+          for name in ('img1.png', 'img2.jpg', 'photo.gif')
+      ]
+      self.assertEqual(found, wanted)
+
+  def test_files_paths_with_no_images(self):
+    """A folder holding only non-image files yields an empty list."""
+    with tempfile.TemporaryDirectory() as folder:
+      # Neither extension is in the image-extension list.
+      self._touch_all(folder, ['doc1.txt', 'readme.md'])
+
+      found = utils.files_paths(folder)
+
+      self.assertEqual(found, [])
+
+  def test_files_paths_empty_folder(self):
+    """A folder with no entries yields an empty list."""
+    with tempfile.TemporaryDirectory() as folder:
+      found = utils.files_paths(folder)
+
+      self.assertEqual(found, [])
+
+
+if __name__ == '__main__':
+  unittest.main()  # Runs this module's tests when executed as a script.