OSUrobotics · lukestroh · Jul 7, 2023 · Jul 8, 2023 · Jul 9, 2023 · Jul 10, 2023
diff --git a/.flake8 b/.flake8
@@ -0,0 +1,8 @@
+[flake8]
+max-line-length = 120
+exclude = 
+    .git, 
+    __pycache__, 
+    build,
+    dist,
+    old
diff --git a/.gitignore b/.gitignore
@@ -0,0 +1,5 @@
+venv/
+points/
+
+meshes/
+bags/
diff --git a/.vscode/settings.json b/.vscode/settings.json
@@ -0,0 +1,6 @@
+{
+    "[python]": {
+        "editor.defaultFormatter": "ms-python.black-formatter"
+    },
+    "python.formatting.provider": "none"
+}
diff --git a/Image_based/BaseStatsImage.py b/Image_based/BaseStatsImage.py
@@ -0,0 +1,202 @@
+#!/usr/bin/env python3
+
+# Given a mask image name, read the image in and perform the following statistical calculations
+# PCA - find major and minor axes
+#  Find the bounding box, max width along the major axis
+#
+# Caches data in image name.json
+#
+
+
+import numpy as np
+import cv2
+from os.path import exists
+import json
+from line_seg_2d import LineSeg2D
+from HandleFileNames import HandleFileNames
+
+
+class BaseStatsImage:
+    _width = 0
+    _height = 0
+
+    _x_grid = None
+    _y_grid = None
+
+    @staticmethod
+    def _init_grid_(in_im):
+        """INitialize width, height, xgrid, etc so we don't have to keep re-making it
+        :param in_im: Input image
+        """
+        if BaseStatsImage._width == in_im.shape[1] and BaseStatsImage._height == in_im.shape[0]:
+            return
+        BaseStatsImage._width = in_im.shape[1]
+        BaseStatsImage._height = in_im.shape[0]
+
+        BaseStatsImage._x_grid, BaseStatsImage._y_grid = np.meshgrid(
+            np.linspace(0.5, BaseStatsImage._width - 0.5, BaseStatsImage._width),
+            np.linspace(0.5, BaseStatsImage._height - 0.5, BaseStatsImage._height),
+        )
+
+    def __init__(self, fname_mask_image, fname_calculated=None, fname_debug=None, b_recalc=False):
+        """Given an image, calculate the main axis and width along that axis
+          If fname_calculated is given, check to see if the data is already calculated - if so, read it in,
+          otherwise, calculate and write out
+          If fname_debug is given, the write out a debug image with the main axis and end points marked
+        @param fname_mask_image: name of mask file, rgb or gray scale image with white where the mask is
+        @param fname_calculated: the file name for the saved .json file; should be image name w/o _stats.json
+        @param fname_debug: the file name for a debug image showing the bounding box, etc
+        @param b_recalc: Force recalculate the result, y/n"""
+
+        self.stats_dict = None
+        mask_image_rgb = cv2.imread(fname_mask_image)
+        if len(mask_image_rgb.shape) == 3:
+            self.mask_image = cv2.cvtColor(mask_image_rgb, cv2.COLOR_BGR2GRAY)
+        else:
+            self.mask_image = mask_image_rgb
+        self._init_grid_(self.mask_image)
+
+        self.fname_calculated = None
+        if fname_calculated:
+            self.fname_calculated = fname_calculated + "_stats.json"
+
+        # Calculate the stats for this image
+        if b_recalc or not fname_calculated or not exists(fname_calculated):
+            # Cached data doesn't exist, or we need to re-calculated
+            self.stats_dict = self.stats_image(self.mask_image)
+
+            # TODO pull out into a read/write method
+            try:
+                # Convert any numpy arrays to lists prior to writing out
+                for k, v in self.stats_dict.items():
+                    try:
+                        if v.size == 2:
+                            self.stats_dict[k] = [v[0], v[1]]
+                    except AttributeError:
+                        pass
+                # If this fails, make a CalculatedData and DebugImages folder in the data/forcindy folder
+                with open(self.fname_calculated, "w") as f:
+                    json.dump(self.stats_dict, f, indent=2)
+            except FileNotFoundError:
+                if fname_calculated:
+                    print(f"BaseStats Image: File not found {fname_calculated}")
+        else:
+            with open(self.fname_calculated, "r") as f:
+                self.stats_dict = json.load(f)
+
+        # Undo the numpy array -> list
+        for k, v in self.stats_dict.items():
+            try:
+                if len(v) == 2:
+                    self.stats_dict[k] = np.array([v[0], v[1]])
+            except TypeError:
+                pass
+
+        if fname_debug:
+            im_debug = mask_image_rgb
+            if len(mask_image_rgb.shape) == 1:
+                im_debug = cv2.cvtColor(mask_image_rgb, cv2.COLOR_GRAY2RGB)
+            # Add the lines showing the eigen vecs
+            self.debug_image(im_debug)
+            cv2.imwrite(fname_debug, im_debug)
+
+    @staticmethod
+    def stats_image(in_im):
+        """Add statistics (bounding box, left right, orientation, radius] to image
+        Note: Could probably do this without transposing image, but...
+        Doing this as a static method so it can be used in a stand-alone pipeline
+        @param in_im gray scale image with mask non-zero
+        @returns stats as a dictionary of values"""
+
+        BaseStatsImage._init_grid_(in_im)
+
+        pixs_in_mask = in_im > 0
+
+        xs = BaseStatsImage._x_grid[pixs_in_mask]
+        ys = BaseStatsImage._y_grid[pixs_in_mask]
+
+        stats = {"x_min": np.min(xs), "y_min": np.min(ys), "x_max": np.max(xs), "y_max": np.max(ys)}
+        stats["x_span"] = stats["x_max"] - stats["x_min"]
+        stats["y_span"] = stats["y_max"] - stats["y_min"]
+
+        avg_width = 0.0
+        count_width = 0
+        if stats["x_span"] > stats["y_span"]:
+            stats["Direction"] = "left_right"
+            stats["Length"] = stats["x_span"]
+            for r in range(0, BaseStatsImage._width):
+                if sum(pixs_in_mask[:, r]) > 0:
+                    avg_width += sum(pixs_in_mask[:, r] > 0)
+                    count_width += 1
+        else:
+            stats["Direction"] = "up_down"
+            stats["Length"] = stats["y_span"]
+            for c in range(0, BaseStatsImage._height):
+                if sum(pixs_in_mask[c, :]) > 0:
+                    avg_width += sum(pixs_in_mask[c, :] > 0)
+                    count_width += 1
+        stats["width"] = avg_width / count_width
+        stats["center"] = np.array([np.mean(xs), np.mean(ys)])
+
+        x_matrix = np.zeros([2, xs.shape[0]])
+        x_matrix[0, :] = xs.transpose() - stats["center"][0]
+        x_matrix[1, :] = ys.transpose() - stats["center"][1]
+        covariance_matrix = np.cov(x_matrix)
+        eigen_values, eigen_vectors = np.linalg.eig(covariance_matrix)
+        if eigen_values[0] < eigen_values[1]:
+            stats["EigenValues"] = [np.min(eigen_values), np.max(eigen_values)]
+            stats["EigenVector"] = eigen_vectors[1, :]
+        else:
+            stats["EigenValues"] = [np.min(eigen_values), np.max(eigen_values)]
+            stats["EigenVector"] = eigen_vectors[0, :]
+        eigen_ratio = stats["EigenValues"][1] / stats["EigenValues"][0]
+        stats["EigenVector"][1] *= -1
+        stats["EigenMinorVector"] = np.array([stats["EigenVector"][1], -stats["EigenVector"][0]])
+        stats["EigenRatio"] = eigen_ratio
+        stats["lower_left"] = stats["center"] - stats["EigenVector"] * (stats["Length"] * 0.5)
+        stats["upper_right"] = stats["center"] + stats["EigenVector"] * (stats["Length"] * 0.5)
+        stats["left_edge"] = stats["center"] - stats["EigenMinorVector"] * (stats["width"] * 0.5)
+        stats["right_edge"] = stats["center"] + stats["EigenMinorVector"] * (stats["width"] * 0.5)
+        print(stats)
+        print(f"Eigen ratio {eigen_ratio}")
+        return stats
+
+    def debug_image(self, in_image):
+        """Draw the eigen vectors/points on the image. Note, this edits the image
+        @param in_image: The image to draw on top of"""
+        p1 = self.stats_dict["lower_left"]
+        p2 = self.stats_dict["upper_right"]
+        LineSeg2D.draw_line(in_image, p1, p2, (220, 128, 220), 2)
+
+        p1 = self.stats_dict["left_edge"]
+        p2 = self.stats_dict["right_edge"]
+        LineSeg2D.draw_line(in_image, p1, p2, (128, 128, 128), 2)
+
+        pc = self.stats_dict["center"]
+        LineSeg2D.draw_cross(in_image, pc, (256, 256, 128), 1, 2)
+
+        xmin = self.stats_dict["x_min"]
+        xmax = self.stats_dict["x_max"]
+        ymin = self.stats_dict["y_min"]
+        ymax = self.stats_dict["y_max"]
+        LineSeg2D.draw_rect(in_image, [[xmin, xmax], [ymin, ymax]], (256, 128, 128), 2)
+
+
+if __name__ == "__main__":
+    # path_bpd = "./data/trunk_segmentation_names.json"
+    path_bpd = "./data/forcindy_fnames.json"
+    all_files = HandleFileNames.read_filenames(path_bpd)
+
+    b_do_debug = True
+    b_do_recalc = False
+    for ind in all_files.loop_masks():
+        mask_fname = all_files.get_mask_name(path=all_files.path, index=ind, b_add_tag=True)
+        mask_fname_debug = all_files.get_mask_name(path=all_files.path_debug, index=ind, b_add_tag=True)
+        if not b_do_debug:
+            mask_fname_debug = ""
+
+        mask_fname_calculate = all_files.get_mask_name(path=all_files.path_calculated, index=ind, b_add_tag=False)
+
+        if not exists(mask_fname):
+            raise ValueError(f"Error, file {mask_fname} does not exist")
+        b_stats = BaseStatsImage(mask_fname, mask_fname_calculate, mask_fname_debug, b_recalc=b_do_recalc)