Spaces:

Detomo
/

eisei-tracability-ai

Running

App Files Community

vumichien committed on Sep 24, 2024

Commit

d2e5b70

verified ·

1 Parent(s): f723ada

Update main.py

Browse files

Files changed (1) hide show

main.py +108 -13

main.py CHANGED Viewed

@@ -72,13 +72,91 @@ LOGGING_CONFIG = {
 logging.config.dictConfig(LOGGING_CONFIG)
-def parse_detection(detections):
     parsed_rows = []
     for i in range(len(detections.xyxy)):
-        x_min = float(detections.xyxy[i][0])
-        y_min = float(detections.xyxy[i][1])
-        x_max = float(detections.xyxy[i][2])
-        y_max = float(detections.xyxy[i][3])
         width = int(x_max - x_min)
         height = int(y_max - y_min)
@@ -121,15 +199,29 @@ def infer(image):
     start_time = time.time()
     image_arr = np.frombuffer(image, np.uint8)
     image = cv2.imdecode(image_arr, cv2.IMREAD_COLOR)
-    image = cv2.resize(image, (1920, 1920))
     results = onnx_model(image)[0]
-    # detections = sv.Detections.from_ultralytics(results)
     slicer = sv.InferenceSlicer(callback=callback, slice_wh=(640, 640))
     detections = slicer(image=image)
     logging.info("Completed slicing and detection")
-    parsed_rows = parse_detection(detections)
     # Count the occurrences of each class
     class_counts = defaultdict(int)
     for detection in parsed_rows:
@@ -140,16 +232,19 @@ def infer(image):
     )
     logging.info(f"Summary info: {summary_info}")
     logging.info(f"Run time: {time.time() - start_time:.2f} seconds")
-    # label_annotator = sv.LabelAnnotator(text_color=sv.Color.BLACK)
-    bounding_box_annotator = sv.BoundingBoxAnnotator(thickness=4)
     annotated_image = image.copy()
     annotated_image = bounding_box_annotator.annotate(scene=annotated_image, detections=detections)
-    # annotated_image = label_annotator.annotate(scene=annotated_image, detections=detections)
-    # logging.info("Annotated image")
-    return annotated_image, parsed_rows
 @app.post("/process-image/")
 async def process_image(image: UploadFile = File(...), draw_boxes: bool = False):
     filename = image.filename

 logging.config.dictConfig(LOGGING_CONFIG)
+# def parse_detection(detections):
+#     parsed_rows = []
+#     for i in range(len(detections.xyxy)):
+#         x_min = float(detections.xyxy[i][0])
+#         y_min = float(detections.xyxy[i][1])
+#         x_max = float(detections.xyxy[i][2])
+#         y_max = float(detections.xyxy[i][3])
+#         width = int(x_max - x_min)
+#         height = int(y_max - y_min)
+#         row = {
+#             "top": int(y_min),
+#             "left": int(x_min),
+#             "width": width,
+#             "height": height,
+#             "class_id": ""
+#             if detections.class_id is None
+#             else int(detections.class_id[i]),
+#             "confidence": ""
+#             if detections.confidence is None
+#             else float(detections.confidence[i]),
+#             "tracker_id": ""
+#             if detections.tracker_id is None
+#             else int(detections.tracker_id[i]),
+#         }
+#         if hasattr(detections, "data"):
+#             for key, value in detections.data.items():
+#                 row[key] = (
+#                     str(value[i])
+#                     if hasattr(value, "__getitem__") and value.ndim != 0
+#                     else str(value)
+#                 )
+#         parsed_rows.append(row)
+#     return parsed_rows
+# # Run inference
+# def callback(image_slice: np.ndarray) -> sv.Detections:
+#     # logging.info("Running callback for image slice")
+#     results = onnx_model(image_slice)[0]
+#     return sv.Detections.from_ultralytics(results)
+# def infer(image):
+#     start_time = time.time()
+#     image_arr = np.frombuffer(image, np.uint8)
+#     image = cv2.imdecode(image_arr, cv2.IMREAD_COLOR)
+#     image = cv2.resize(image, (1920, 1920))
+#     results = onnx_model(image)[0]
+#     # detections = sv.Detections.from_ultralytics(results)
+#     slicer = sv.InferenceSlicer(callback=callback, slice_wh=(640, 640))
+#     detections = slicer(image=image)
+#     logging.info("Completed slicing and detection")
+#     parsed_rows = parse_detection(detections)
+#     # Count the occurrences of each class
+#     class_counts = defaultdict(int)
+#     for detection in parsed_rows:
+#         class_name = detection.get("class_name", "Unknown")
+#         class_counts[class_name] += 1
+#     summary_info = ", ".join(
+#         [f"{count} {class_name}" for class_name, count in class_counts.items()]
+#     )
+#     logging.info(f"Summary info: {summary_info}")
+#     logging.info(f"Run time: {time.time() - start_time:.2f} seconds")
+#     # label_annotator = sv.LabelAnnotator(text_color=sv.Color.BLACK)
+#     bounding_box_annotator = sv.BoundingBoxAnnotator(thickness=4)
+#     annotated_image = image.copy()
+#     annotated_image = bounding_box_annotator.annotate(scene=annotated_image, detections=detections)
+#     # annotated_image = label_annotator.annotate(scene=annotated_image, detections=detections)
+#     # logging.info("Annotated image")
+#     return annotated_image, parsed_rows
+def parse_detection(detections, scale_x, scale_y):
     parsed_rows = []
     for i in range(len(detections.xyxy)):
+        # Rescale the coordinates to match the original image size
+        x_min = float(detections.xyxy[i][0]) / scale_x
+        y_min = float(detections.xyxy[i][1]) / scale_y
+        x_max = float(detections.xyxy[i][2]) / scale_x
+        y_max = float(detections.xyxy[i][3]) / scale_y
         width = int(x_max - x_min)
         height = int(y_max - y_min)
     start_time = time.time()
     image_arr = np.frombuffer(image, np.uint8)
     image = cv2.imdecode(image_arr, cv2.IMREAD_COLOR)
+    # Get original dimensions
+    original_height, original_width = image.shape[:2]
+    # Resize image for detection
+    target_size = 1920
+    image = cv2.resize(image, (target_size, target_size))
+    # Compute scale factors
+    scale_x = target_size / original_width
+    scale_y = target_size / original_height
+    # Run model
     results = onnx_model(image)[0]
+    # Using slicer for detection
     slicer = sv.InferenceSlicer(callback=callback, slice_wh=(640, 640))
     detections = slicer(image=image)
     logging.info("Completed slicing and detection")
+    # Parse detections and adjust coordinates to original size
+    parsed_rows = parse_detection(detections, scale_x, scale_y)
     # Count the occurrences of each class
     class_counts = defaultdict(int)
     for detection in parsed_rows:
     )
     logging.info(f"Summary info: {summary_info}")
     logging.info(f"Run time: {time.time() - start_time:.2f} seconds")
+    # Annotate the resized image
+    bounding_box_annotator = sv.BoundingBoxAnnotator(thickness=4)
     annotated_image = image.copy()
     annotated_image = bounding_box_annotator.annotate(scene=annotated_image, detections=detections)
+    # Resize the annotated image back to original dimensions
+    annotated_image = cv2.resize(annotated_image, (original_width, original_height))
+    # Return the resized annotated image and parsed detection results
+    return annotated_image, parsed_rows
 @app.post("/process-image/")
 async def process_image(image: UploadFile = File(...), draw_boxes: bool = False):
     filename = image.filename