Skip to content

Commit

Permalink
add a __main__ self-test configured with a json file
Browse files Browse the repository at this point in the history
- the __main__ self-test can load an image from a file
  or use the video stream from a camera
- It takes the path to a json file that specifies a
  list of image transforms, there order and their arguments
- functions have been added to load and parse the json file
  and use it to construct the transform pipeline.
- The transform pipeline is implemented with a run() method
  that applies the transforms in order.
- Comments in the code document the json file format.
  • Loading branch information
Ezward committed Jun 26, 2023
1 parent 3dee532 commit 5d2a841
Showing 1 changed file with 363 additions and 3 deletions.
366 changes: 363 additions & 3 deletions donkeycar/parts/image_transformations.py
Original file line number Diff line number Diff line change
Expand Up @@ -50,7 +50,15 @@ def image_transformer(name: str, config):
config.ROI_TRAPEZE_MIN_Y,
config.ROI_TRAPEZE_MAX_Y
)

elif "TRAPEZE_EDGE" == name:
return cv_parts.ImgTrapezoidalEdgeMask(
config.ROI_TRAPEZE_UL,
config.ROI_TRAPEZE_UR,
config.ROI_TRAPEZE_LL,
config.ROI_TRAPEZE_LR,
config.ROI_TRAPEZE_MIN_Y,
config.ROI_TRAPEZE_MAX_Y
)
elif "CROP" == name:
return cv_parts.ImgCropMask(
config.ROI_CROP_LEFT,
Expand All @@ -75,7 +83,7 @@ def image_transformer(name: str, config):
return cv_parts.ImgHSV2BGR()
elif "RGB2GRAY" == name:
return cv_parts.ImgRGB2GRAY()
elif "RBGR2GRAY" == name:
elif "BGR2GRAY" == name:
return cv_parts.ImgBGR2GRAY()
elif "HSV2GRAY" == name:
return cv_parts.ImgHSV2GRAY()
Expand Down Expand Up @@ -108,7 +116,7 @@ def image_transformer(name: str, config):
elif name.startswith("CUSTOM"):
return custom_transformer(name, config)
else:
msg = f"{name} is not a valid augmentation"
msg = f"{name} is not a valid transformation"
logger.error(msg)
raise ValueError(msg)

Expand Down Expand Up @@ -213,3 +221,355 @@ def run(self, image):
else:
raise ValueError(f"Unable to load custom tranformation module at {file_path}")


class ImgTransformList:
"""
A list of image transforms supplied by
a json file and run in the order and with
the arguments specified in the json.
"""
def __init__(self, transforms) -> None:
self.transforms = transforms

@staticmethod
def fromJson(filepath):
config = loadImgTransformJson(filepath)
transforms = imgTransformListFromJson(config)
return ImgTransformList(transforms)

def run(self, image):
for transform in self.transforms:
image = transform.run(image)
return image

def shutdown(self):
for transform in self.transforms:
if callable(getattr(transform, "shutdown", None)):
transform.shutdown()


def imgTransformFromJson(transform_config):
"""
Construct a single Image transform from given dictionary.
The dictionary corresponds the the image transform's
constructor arguments, so it can be passed to the
constructure using object destructuring.
"""
if not isinstance(transform_config, object):
raise TypeError("transform_config must be a dictionary")


#
# a config is a [string, object] pair
# where the string specifies the transform
# and the optional object provides the arguments
# to it's constructor.
#
transformation = transform_config[0]
args = transform_config[1] if len(transform_config) == 2 else None
transformer = None

#
# masking transformations
#
if "TRAPEZE_EDGE" == transformation:
transformer = cv_parts.ImgTrapezoidalEdgeMask(**args)
elif 'CROP' == transformation:
transformer = cv_parts.ImgCropMask(**args)

#
# color space transformations
#
elif "RGB2BGR" == transformation:
transformer = cv_parts.ImgRGB2BGR()
elif "BGR2RGB" == transformation:
transformer = cv_parts.ImgBGR2RGB()
elif "RGB2HSV" == transformation:
transformer = cv_parts.ImgRGB2HSV()
elif "HSV2RGB" == transformation:
transformer = cv_parts.ImgHSV2RGB()
elif "BGR2HSV" == transformation:
transformer = cv_parts.ImgBGR2HSV()
elif "HSV2BGR" == transformation:
transformer = cv_parts.ImgHSV2BGR()
elif "RGB2GREY" == transformation or "RGB2GRAY" == transformation:
transformer = cv_parts.ImgRGB2GRAY()
elif "GREY2RGB" == transformation or "GRAY2RGB" == transformation:
transformer = cv_parts.ImgGRAY2RGB()
elif "BGR2GREY" == transformation or "BGR2GRAY" == transformation:
transformer = cv_parts.ImgBGR2GRAY()
elif "GREY2BGR" == transformation or "GRAY2BGR" == transformation:
transformer = cv_parts.ImgGRAY2BGR()
elif "HSV2GREY" == transformation or "HSV2GRAY" == transformation:
transformer = cv_parts.ImgHSV2GRAY()
elif "CANNY" == transformation:
# canny edge detection
transformer = cv_parts.ImgCanny(**args)
#
# blur transformations
#
elif "GBLUR" == transformation:
transformer = cv_parts.ImgGaussianBlur(**args)
elif "BLUR" == transformation:
transformer = cv_parts.ImgSimpleBlur(**args)
#
# resize transformations
#
elif "RESIZE" == transformation:
transformer = cv_parts.ImageResize(**args)
elif "SCALE" == transformation:
transformer = cv_parts.ImageScale(args.scale, args.scale_height)

#
# custom transform
#
elif transformation.startswith("CUSTOM"):
transformer = custom_transformer(transformation, args)

#
# not a valid transform name
#
else:
msg = f"'{transformation}' is not a valid transformation"
logger.error(msg)
raise ValueError(msg)

return transformer



def imgTransformListFromJson(transforms_config):
"""
Parse one or more Image transforms from given list
and return an ImgTransformer that applies
them with the arguments and in the order given
in the file.
"""
if not isinstance(transforms_config, list):
raise TypeError("transforms_config must be a list")

transformers = []

for transform_config in transforms_config:
transformers.append(imgTransformFromJson(transform_config))

return transformers



def loadImgTransformJson(filepath):
"""
Load a json file that specifies a list with one or more
image transforms, their order and their arguments.
The list will contain a series of tuples as a two
element list. The first element of the tuple is the name
of the transform and the second element is a dictionary
the named arguments for the transform's constructor.
The named arguments using object destructuring except
for the custom transform where the dictionary is
pass as-is without destructuring.
You can look at the constructor for each image transform
in cv.py to see what the fields of the argument object in
the json should be. You may leave out an argument if it
has a default.
Here is an example that has one of each transformtion
specified with all of it's arguments.
```
[
["BGR2GRAY"],
["BGR2HSV"],
["BGR2RGB"],
["BLUR", {"kernel_size": 5, "kernel_y": null}],
["CANNY", {"low_threshold": 60, "high_threshold": 110, "aperture_size": 3, "l2gradient": false}],
["CROP", {"left": 0, "top": 0, "right": 0, "bottom": 0}],
["GBLUR", {"kernel_size": 5, "kernel_y": null}],
["GRAY2BGR"],
["GRAY2RGB"],
["HSV2BGR"],
["HSV2RGB"],
["HSV2GRAY"],
["RESIZE", {"width": 160, "height": 120}],
["RGB2BGR"],
["RGB2GRAY"],
["RGB2HSV"],
["SCALE", {"scale": 1.0, "scale_height": null}],
["TRAPEZE", {"left":0, "right":0, "bottom_left":0, "bottom_right":0, "top":0, "bottom":0, "fill": [255,255,255]}],
["TRAPEZE_EDGE", {"upper_left":0, "upper_right":0, "lower_left":0, "lower_right":0, "top":0, "bottom":0, "fill": [255,255,255]}]
]
```
"""
import json

#
# load and parse the file
#
try:
with open(filepath) as f:
try:
data = json.load(f)
#
# TODO: validate json data against a schema
#
return data
except e:
logger.error(f"Can't parse transforms json due to error: {e}")
raise e
except OSError as e:
logger.error(f"Can't open transforms json file '{filepath}' due to error: {e}")
raise e

if __name__ == "__main__":
"""
Image transforms self test.
You provide a json file that specifies a transformation pipeline
and configure either an single image to be loaded or a camera to be used.
The image transformation pipeline is constructed and applied the
the configured image source and shown in an opencv window.
This json specifies a pipeline that applies canny edge detection to the image.
```
[
["RGB2GRAY"],
["BLUR", {}],
["CANNY", {}],
["CROP", {"left": 0, "top": 45, "right": 0, "bottom": 0}],
["GRAY2RGB"]
]
```
Here the "BLUR" and "CANNY" transforms are using default parameters, so the
argument object is empty. The "CROP" transform is supplied with a argument object
that specifies all named parameters and their values. The color conversion transforms
"RGB2GRAY" and "GRAY2RGB" do not have arguments so no argument object is supplied.
If it was in a json file named `canny_pipeline.json` in `pi` home folder the usage would be:
```
cd donkeycar/parts
python image_transformations.py --width=640 --height=480 --json=/Home/pi/canny_pipeline.json
```
"""
import argparse
import sys
import time
import cv2
import numpy as np
import logging

# parse arguments
parser = argparse.ArgumentParser()
parser.add_argument("-c", "--camera", type=int, default=0,
help = "index of camera if using multiple cameras")
parser.add_argument("-wd", "--width", type=int, default=160,
help = "width of image to capture")
parser.add_argument("-ht", "--height", type=int, default=120,
help = "height of image to capture")
parser.add_argument("-f", "--file", type=str,
help = "path to image file to user rather that a camera")
parser.add_argument("-js", "--json", type=str,
help = "path to json file with list of tranforms")


# Read arguments from command line
args = parser.parse_args()

image_source = None
help = []
if args.file is None:
if args.camera < 0:
help.append("-c/--camera must be >= 0")
if args.width is None or args.width < 160:
help.append("-wd/--width must be >= 160")
if args.height is None or args.height < 120:
help.append("-ht/--height must be >= 120")

if args.json is None:
help.append("-js/--json must be supplied to specify the json file with transformers.")


if len(help) > 0:
parser.print_help()
for h in help:
print(" " + h)
sys.exit(1)

#
# load file OR setup camera
#
cap = None
width = None
height = None
depth = 3
if args.file is not None:
print(f"Loading image from file `{args.file}`...")
image_source = cv_parts.CvImgFromFile(args.file, image_w=args.width, image_h=args.height, copy=True)
height, width, depth = cv_parts.image_shape(image_source.run())
else:
print("Initializing camera...")
width = args.width
height = args.height
image_source = cv_parts.CvCam(image_w=width, image_h=height, iCam=args.camera)
print("done.")

#
# read list transformations from json file
# with fields like:
#
# [
# ["BGR2GRAY"],
# ["BGR2HSV"],
# ["BGR2RGB"],
# ["BLUR", {"gaussian": false, "kernel": 5, "kernel_y": null}]
# ["CANNY", {"low_threshold": 60, "high_threshold": 110, "aperture": 3}]
# ["CROP", {"left": 0, "top": 0, "right": 0, "bottom": 0}],
# ["GRAY2BGR"],
# ["GRAY2RGB"],
# ["HSV2BGR"],
# ["HSV2RGB"],
# ["HSV2GRAY"],
# ["RESIZE", {"width": 160, "height": 120}],
# ["RGB2BGR"],
# ["RGB2GRAY"],
# ["RGB2HSV"],
# ["SCALE", {"scale_width": 1.0, "scale_height": 1.0}],
# ["TRAPEZE", {"upper_left":0, "upper_right":0, "lower_left":0, "lower_right":0, "top":0, "bottom":0}]
# ]
#
print("Loading tranform list from json file `{args.json}`...")
transformer = ImgTransformList.fromJson(args.json)
print("done.")

# Creating a window for later use
window_name = 'image_tranformer'
cv2.namedWindow(window_name)

while(1):

frame = image_source.run()

#
# apply the augmentation
#
transformed_image = transformer.run(frame)

#
# show augmented image
#
cv2.imshow(window_name, transformed_image)

k = cv2.waitKey(5) & 0xFF
if k == ord('q') or k == ord('Q'): # 'Q' or 'q'
break

if cap is not None:
cap.release()

cv2.destroyAllWindows()

0 comments on commit 5d2a841

Please sign in to comment.