Fix Windows non-UTF source filenames (#4524)

Co-authored-by: Kayzwer <68285002+Kayzwer@users.noreply.github.com>
Glenn Jocher 2023-08-24 03:22:26 +02:00 committed by GitHub
parent a7419617a6
commit 1db9afc2e5
16 changed files with 129 additions and 95 deletions

ultralytics/data/augment.py

@@ -634,7 +634,7 @@ class CopyPaste:
         result = cv2.flip(im, 1)  # augment segments (flip left-right)
         i = cv2.flip(im_new, 1).astype(bool)
-        im[i] = result[i]  # cv2.imwrite('debug.jpg', im)  # debug
+        im[i] = result[i]
 
         labels['img'] = im
         labels['cls'] = cls

ultralytics/data/converter.py

@ -9,8 +9,6 @@ import cv2
import numpy as np
from tqdm import tqdm
from ultralytics.utils.checks import check_requirements
def coco91_to_coco80_class():
"""Converts 91-index COCO class IDs to 80-index COCO class IDs.
@ -18,7 +16,6 @@ def coco91_to_coco80_class():
Returns:
(list): A list of 91 class IDs where the index represents the 80-index class ID and the value is the
corresponding 91-index class ID.
"""
return [
0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, None, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, None, 24, 25, None,
@@ -119,9 +116,7 @@ def convert_coco(labels_dir='../coco/annotations/', use_segments=False, use_keyp
                     if len(ann['segmentation']) == 0:
                         segments.append([])
                         continue
-                    if isinstance(ann['segmentation'], dict):
-                        ann['segmentation'] = rle2polygon(ann['segmentation'])
-                    if len(ann['segmentation']) > 1:
+                    elif len(ann['segmentation']) > 1:
                         s = merge_multi_segment(ann['segmentation'])
                         s = (np.concatenate(s, axis=0) / np.array([w, h])).reshape(-1).tolist()
                     else:
@@ -131,9 +126,8 @@ def convert_coco(labels_dir='../coco/annotations/', use_segments=False, use_keyp
                     if s not in segments:
                         segments.append(s)
                 if use_keypoints and ann.get('keypoints') is not None:
-                    k = (np.array(ann['keypoints']).reshape(-1, 3) / np.array([w, h, 1])).reshape(-1).tolist()
-                    k = box + k
-                    keypoints.append(k)
+                    keypoints.append(box + (np.array(ann['keypoints']).reshape(-1, 3) /
+                                            np.array([w, h, 1])).reshape(-1).tolist())
 
             # Write
             with open((fn / f).with_suffix('.txt'), 'a') as file:
@@ -237,34 +231,6 @@ def convert_dota_to_yolo_obb(dota_root_path: str):
         convert_label(image_name_without_ext, w, h, orig_label_dir, save_dir)
 
 
-def rle2polygon(segmentation):
-    """
-    Convert Run-Length Encoding (RLE) mask to polygon coordinates.
-
-    Args:
-        segmentation (dict, list): RLE mask representation of the object segmentation.
-
-    Returns:
-        (list): A list of lists representing the polygon coordinates for each contour.
-
-    Note:
-        Requires the 'pycocotools' package to be installed.
-    """
-    check_requirements('pycocotools')
-    from pycocotools import mask
-
-    m = mask.decode(segmentation)
-    m[m > 0] = 255
-    contours, _ = cv2.findContours(m, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_TC89_KCOS)
-    polygons = []
-    for contour in contours:
-        epsilon = 0.001 * cv2.arcLength(contour, True)
-        contour_approx = cv2.approxPolyDP(contour, epsilon, True)
-        polygon = contour_approx.flatten().tolist()
-        polygons.append(polygon)
-    return polygons
-
-
 def min_index(arr1, arr2):
     """
     Find a pair of indexes with the shortest distance between two arrays of 2D points.

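Since rle2polygon() was the converter's only consumer of pycocotools, the dependency check above disappears with it, and convert_coco() no longer polygonizes COCO annotations stored as RLE dicts. For anyone who still needs that step, here is a minimal standalone sketch of the removed logic (the helper name rle_to_polygons is hypothetical; it assumes pycocotools and OpenCV are installed):

import cv2
from pycocotools import mask as coco_mask


def rle_to_polygons(segmentation):
    """Decode an RLE segmentation to a binary mask and approximate each contour as a polygon."""
    m = coco_mask.decode(segmentation)  # (h, w) uint8 mask of 0/1 values
    m[m > 0] = 255
    contours, _ = cv2.findContours(m, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_TC89_KCOS)
    polygons = []
    for contour in contours:
        epsilon = 0.001 * cv2.arcLength(contour, True)  # tolerance of roughly 0.1% of the contour perimeter
        polygons.append(cv2.approxPolyDP(contour, epsilon, True).flatten().tolist())
    return polygons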
ultralytics/data/utils.py

@@ -144,9 +144,7 @@ def verify_image_label(args):
             if keypoint:
                 keypoints = lb[:, 5:].reshape(-1, nkpt, ndim)
                 if ndim == 2:
-                    kpt_mask = np.ones(keypoints.shape[:2], dtype=np.float32)
-                    kpt_mask = np.where(keypoints[..., 0] < 0, 0.0, kpt_mask)
-                    kpt_mask = np.where(keypoints[..., 1] < 0, 0.0, kpt_mask)
+                    kpt_mask = np.where((keypoints[..., 0] < 0) | (keypoints[..., 1] < 0), 0.0, 1.0).astype(np.float32)
                     keypoints = np.concatenate([keypoints, kpt_mask[..., None]], axis=-1)  # (nl, nkpt, 3)
             lb = lb[:, :5]
         return im_file, lb, shape, segments, keypoints, nm, nf, ne, nc, msg

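The keypoint change above folds three sequential np.where() calls into one vectorized condition: a keypoint is marked invisible when either coordinate is negative. A small sketch with a hypothetical toy array, showing the two forms agree:

import numpy as np

keypoints = np.array([[[0.5, 0.5], [-1.0, 0.2], [0.3, -1.0]]])  # (nl=1, nkpt=3, ndim=2)

# old form: start from ones, then zero out negative x, then negative y
old = np.ones(keypoints.shape[:2], dtype=np.float32)
old = np.where(keypoints[..., 0] < 0, 0.0, old)
old = np.where(keypoints[..., 1] < 0, 0.0, old)

# new form: one combined condition
new = np.where((keypoints[..., 0] < 0) | (keypoints[..., 1] < 0), 0.0, 1.0).astype(np.float32)

assert np.array_equal(old, new)  # both flag out-of-frame keypoints as not visible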
ultralytics/engine/exporter.py

@@ -127,7 +127,7 @@ class Exporter:
     Attributes:
         args (SimpleNamespace): Configuration for the exporter.
         save_dir (Path): Directory to save results.
         callbacks (list, optional): List of callback functions. Defaults to None.
     """
 
     def __init__(self, cfg=DEFAULT_CFG, overrides=None, _callbacks=None):
@@ -189,7 +189,7 @@ class Exporter:
         model.eval()
         model.float()
         model = model.fuse()
-        for k, m in model.named_modules():
+        for m in model.modules():
             if isinstance(m, (Detect, RTDETRDecoder)):  # Segment and Pose use Detect base class
                 m.dynamic = self.args.dynamic
                 m.export = True
@@ -427,7 +427,7 @@ class Exporter:
         system = 'macos' if MACOS else 'ubuntu' if LINUX else 'windows'  # operating system
         asset = [x for x in assets if system in x][0] if assets else \
             f'https://github.com/pnnx/pnnx/releases/download/20230816/pnnx-20230816-{system}.zip'  # fallback
-        attempt_download_asset(asset, repo='pnnx/pnnx', release='latest')
+        asset = attempt_download_asset(asset, repo='pnnx/pnnx', release='latest')
         unzip_dir = Path(asset).with_suffix('')
         pnnx = ROOT / pnnx_filename  # new location
         (unzip_dir / pnnx_filename).rename(pnnx)  # move binary to ROOT
@@ -502,9 +502,9 @@ class Exporter:
             check_requirements('scikit-learn')  # scikit-learn package required for k-means quantization
             if mlmodel:
                 ct_model = ct.models.neural_network.quantization_utils.quantize_weights(ct_model, bits, mode)
-            else:
+            elif bits == 8:  # mlprogram already quantized to FP16
                 import coremltools.optimize.coreml as cto
-                op_config = cto.OpPalettizerConfig(mode=mode, nbits=bits, weight_threshold=512)
+                op_config = cto.OpPalettizerConfig(mode='kmeans', nbits=bits, weight_threshold=512)
                 config = cto.OptimizationConfig(global_config=op_config)
                 ct_model = cto.palettize_weights(ct_model, config=config)
         if self.args.nms and self.model.task == 'detect':
@@ -839,7 +839,7 @@ class Exporter:
         import coremltools as ct  # noqa
 
         LOGGER.info(f'{prefix} starting pipeline with coremltools {ct.__version__}...')
-        batch_size, ch, h, w = list(self.im.shape)  # BCHW
+        _, _, h, w = list(self.im.shape)  # BCHW
 
         # Output shapes
         spec = model.get_spec()
@@ -857,8 +857,8 @@ class Exporter:
         # Checks
         names = self.metadata['names']
         nx, ny = spec.description.input[0].type.imageType.width, spec.description.input[0].type.imageType.height
-        na, nc = out0_shape
-        # na, nc = out0.type.multiArrayType.shape  # number anchors, classes
+        _, nc = out0_shape  # number of anchors, number of classes
+        # _, nc = out0.type.multiArrayType.shape
         assert len(names) == nc, f'{len(names)} names found for nc={nc}'  # check
 
         # Define output shapes (missing)
@@ -968,7 +968,7 @@ class IOSDetectModel(torch.nn.Module):
     def __init__(self, model, im):
         """Initialize the IOSDetectModel class with a YOLO model and example image."""
         super().__init__()
-        b, c, h, w = im.shape  # batch, channel, height, width
+        _, _, h, w = im.shape  # batch, channel, height, width
         self.model = model
         self.nc = len(model.names)  # number of classes
         if w == h:

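Two changes above alter behavior rather than style: attempt_download_asset() now returns the downloaded file path, so the PNNX fallback URL resolves to a real local path before Path(asset).with_suffix('') is taken, and the CoreML branch palettizes mlprogram weights only for bits == 8, always with k-means (per the inline comment, mlprogram is already FP16). A minimal sketch of that palettization sequence, assuming a converted coremltools mlprogram model (the wrapper name is hypothetical):

import coremltools.optimize.coreml as cto


def palettize_int8(ct_model):
    """Cluster mlprogram weights into a 256-entry k-means palette, as in the export step above."""
    op_config = cto.OpPalettizerConfig(mode='kmeans', nbits=8, weight_threshold=512)
    config = cto.OptimizationConfig(global_config=op_config)
    return cto.palettize_weights(ct_model, config=config)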
ultralytics/engine/predictor.py

@@ -343,8 +343,7 @@ class BasePredictor:
                     h = int(vid_cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
                 else:  # stream
                     fps, w, h = 30, im0.shape[1], im0.shape[0]
-                suffix = '.mp4' if MACOS else '.avi' if WINDOWS else '.avi'
-                fourcc = 'avc1' if MACOS else 'WMV2' if WINDOWS else 'MJPG'
+                suffix, fourcc = ('.mp4', 'avc1') if MACOS else ('.avi', 'WMV2') if WINDOWS else ('.avi', 'MJPG')
                 save_path = str(Path(save_path).with_suffix(suffix))
                 self.vid_writer[idx] = cv2.VideoWriter(save_path, cv2.VideoWriter_fourcc(*fourcc), fps, (w, h))
             self.vid_writer[idx].write(im0)

ultralytics/nn/tasks.py

@@ -261,7 +261,6 @@ class DetectionModel(BaseModel):
         for si, fi in zip(s, f):
             xi = scale_img(x.flip(fi) if fi else x, si, gs=int(self.stride.max()))
             yi = super().predict(xi)[0]  # forward
-            # cv2.imwrite(f'img_{si}.jpg', 255 * xi[0].cpu().numpy().transpose((1, 2, 0))[:, :, ::-1])  # save
             yi = self._descale_pred(yi, fi, si, img_size)
             y.append(yi)
         y = self._clip_augmented(y)  # clip augmented tails

ultralytics/utils/__init__.py

@@ -852,9 +852,10 @@ ENVIRONMENT = 'Colab' if is_colab() else 'Kaggle' if is_kaggle() else 'Jupyter'
 TESTS_RUNNING = is_pytest_running() or is_github_actions_ci()
 set_sentry()
 
-# Apply monkey patches if the script is being run from within the parent directory of the script's location
-from .patches import imread, imshow, imwrite
-# torch.save = torch_save
-if Path(inspect.stack()[0].filename).parent.parent.as_posix() in inspect.stack()[-1].filename:
-    torch.save = torch_save
+# Apply monkey patches
+from .patches import imread, imshow, imwrite, torch_save
+torch.save = torch_save
+if WINDOWS:
+    # Apply cv2 patches for non-ASCII and non-UTF characters in image paths
+    cv2.imread, cv2.imwrite, cv2.imshow = imread, imwrite, imshow

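This block is the core of the fix: on Windows, OpenCV's native imread/imwrite cannot handle paths containing non-ASCII or non-UTF characters, so the patched versions route through np.fromfile plus cv2.imdecode (and cv2.imencode plus ndarray.tofile), which only ever hand raw bytes to OpenCV. A minimal round-trip sketch with a hypothetical non-ASCII filename:

import cv2
import numpy as np

path = '测试图像.jpg'  # hypothetical filename that plain cv2.imread may fail on under Windows
img = np.zeros((64, 64, 3), np.uint8)

cv2.imencode('.jpg', img)[1].tofile(path)  # patched imwrite: encode in memory, write bytes with NumPy
back = cv2.imdecode(np.fromfile(path, np.uint8), cv2.IMREAD_COLOR)  # patched imread: read bytes, decode
assert back is not None and back.shape == (64, 64, 3)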
ultralytics/utils/benchmarks.py

@@ -240,7 +240,7 @@ class ProfileModels:
             if path.is_dir():
                 extensions = ['*.pt', '*.onnx', '*.yaml']
                 files.extend([file for ext in extensions for file in glob.glob(str(path / ext))])
-            elif path.suffix in ('.pt', '.yaml', '.yml'):  # add non-existing
+            elif path.suffix in {'.pt', '.yaml', '.yml'}:  # add non-existing
                 files.append(str(path))
             else:
                 files.extend(glob.glob(str(path)))
@@ -262,7 +262,7 @@ class ProfileModels:
             data = clipped_data
         return data
 
-    def profile_tensorrt_model(self, engine_file: str):
+    def profile_tensorrt_model(self, engine_file: str, eps: float = 1e-7):
         if not self.trt or not Path(engine_file).is_file():
             return 0.0, 0.0
 
@@ -279,7 +279,7 @@ class ProfileModels:
         elapsed = time.time() - start_time
 
         # Compute number of runs as higher of min_time or num_timed_runs
-        num_runs = max(round(self.min_time / elapsed * self.num_warmup_runs), self.num_timed_runs * 50)
+        num_runs = max(round(self.min_time / (elapsed + eps) * self.num_warmup_runs), self.num_timed_runs * 50)
 
         # Timed runs
         run_times = []
@@ -290,7 +290,7 @@ class ProfileModels:
         run_times = self.iterative_sigma_clipping(np.array(run_times), sigma=2, max_iters=3)  # sigma clipping
         return np.mean(run_times), np.std(run_times)
 
-    def profile_onnx_model(self, onnx_file: str):
+    def profile_onnx_model(self, onnx_file: str, eps: float = 1e-7):
         check_requirements('onnxruntime')
         import onnxruntime as ort
 
@@ -330,7 +330,7 @@ class ProfileModels:
         elapsed = time.time() - start_time
 
         # Compute number of runs as higher of min_time or num_timed_runs
-        num_runs = max(round(self.min_time / elapsed * self.num_warmup_runs), self.num_timed_runs)
+        num_runs = max(round(self.min_time / (elapsed + eps) * self.num_warmup_runs), self.num_timed_runs)
 
         # Timed runs
         run_times = []

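The new eps argument guards the run-count estimate: on a very fast model the warmup loop can complete in less than the timer's resolution, making elapsed zero and self.min_time / elapsed a ZeroDivisionError. A toy sketch of the guard with hypothetical numbers:

min_time, num_warmup_runs, num_timed_runs, eps = 60.0, 10, 200, 1e-7

elapsed = 0.0  # warmup finished below the timer resolution
# num_runs = max(round(min_time / elapsed * num_warmup_runs), num_timed_runs)       # ZeroDivisionError
num_runs = max(round(min_time / (elapsed + eps) * num_warmup_runs), num_timed_runs)  # large but finite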
ultralytics/utils/downloads.py

@@ -101,7 +101,11 @@ def zip_directory(directory, compress=True, exclude=('.DS_Store', '__MACOSX'), p
     zip_file = directory.with_suffix('.zip')
     compression = ZIP_DEFLATED if compress else ZIP_STORED
     with ZipFile(zip_file, 'w', compression) as f:
-        for file in tqdm(files_to_zip, desc=f'Zipping {directory} to {zip_file}...', unit='file', disable=not progress):
+        for file in tqdm(files_to_zip,
+                         desc=f'Zipping {directory} to {zip_file}...',
+                         unit='file',
+                         disable=not progress,
+                         bar_format=TQDM_BAR_FORMAT):
             f.write(file, file.relative_to(directory))
 
     return zip_file  # return path to zip file
@@ -159,7 +163,11 @@ def unzip_file(file, path=None, exclude=('.DS_Store', '__MACOSX'), exist_ok=Fals
             LOGGER.info(f'Skipping {file} unzip (already unzipped)')
             return path
 
-        for f in tqdm(files, desc=f'Unzipping {file} to {Path(path).resolve()}...', unit='file', disable=not progress):
+        for f in tqdm(files,
+                      desc=f'Unzipping {file} to {Path(path).resolve()}...',
+                      unit='file',
+                      disable=not progress,
+                      bar_format=TQDM_BAR_FORMAT):
             zipObj.extract(f, path=extract_path)
 
     return path  # return unzip dir

ultralytics/utils/patches.py

@@ -13,20 +13,45 @@ import torch
 _imshow = cv2.imshow  # copy to avoid recursion errors
 
 
-def imread(filename, flags=cv2.IMREAD_COLOR):
+def imread(filename: str, flags: int = cv2.IMREAD_COLOR):
+    """Read an image from a file.
+
+    Args:
+        filename (str): Path to the file to read.
+        flags (int, optional): Flag that can take values of cv2.IMREAD_*. Defaults to cv2.IMREAD_COLOR.
+
+    Returns:
+        (np.ndarray): The read image.
+    """
     return cv2.imdecode(np.fromfile(filename, np.uint8), flags)
 
 
-def imwrite(filename, img):
+def imwrite(filename: str, img: np.ndarray, params=None):
+    """Write an image to a file.
+
+    Args:
+        filename (str): Path to the file to write.
+        img (np.ndarray): Image to write.
+        params (list of ints, optional): Additional parameters. See OpenCV documentation.
+
+    Returns:
+        (bool): True if the file was written, False otherwise.
+    """
     try:
-        cv2.imencode(Path(filename).suffix, img)[1].tofile(filename)
+        cv2.imencode(Path(filename).suffix, img, params)[1].tofile(filename)
         return True
     except Exception:
         return False
 
 
-def imshow(path, im):
-    _imshow(path.encode('unicode_escape').decode(), im)
+def imshow(winname: str, mat: np.ndarray):
+    """Displays an image in the specified window.
+
+    Args:
+        winname (str): Name of the window.
+        mat (np.ndarray): Image to be shown.
+    """
+    _imshow(winname.encode('unicode_escape').decode(), mat)
 
 
 # PyTorch functions ----------------------------------------------------------------------------------------------------
@@ -34,12 +59,17 @@ _torch_save = torch.save  # copy to avoid recursion errors
 
 
 def torch_save(*args, **kwargs):
-    """Use dill (if exists) to serialize the lambda functions where pickle does not do this."""
+    """Use dill (if exists) to serialize the lambda functions where pickle does not do this.
+
+    Args:
+        *args (tuple): Positional arguments to pass to torch.save.
+        **kwargs (dict): Keyword arguments to pass to torch.save.
+    """
     try:
-        import dill as pickle
+        import dill as pickle  # noqa
     except ImportError:
         import pickle
 
     if 'pickle_module' not in kwargs:
-        kwargs['pickle_module'] = pickle
+        kwargs['pickle_module'] = pickle  # noqa
     return _torch_save(*args, **kwargs)
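A short usage sketch of the patched saver: dill, when available, can serialize lambdas that the standard pickle module rejects, and torch_save() forwards whichever module it found to torch.save via the pickle_module keyword. The checkpoint below is hypothetical, and the lambda entry only round-trips if dill is installed (plain pickle raises PicklingError on it):

from ultralytics.utils.patches import torch_save

ckpt = {'epoch': 1, 'scale_fn': lambda x: x * 0.5}  # the lambda defeats the default pickler
torch_save(ckpt, 'ckpt.pt')  # serialized with dill if installed, else falls back to pickle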