# AutoLabelWithYolo/image_editor.py at master · gzxy0102/AutoLabelWithYolo · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
import logging
from typing import List, Dict, Optional, Tuple, Any

import cv2
from PySide6.QtCore import (Qt, QRect, QPoint, Signal)
from PySide6.QtGui import (QPixmap, QImage, QPainter, QPen, QColor, QFont)
from PySide6.QtWidgets import (QLabel, QMessageBox, QMenu, QInputDialog)

from utils import generate_distinct_colors

# Module-level logger, named after this module via __name__.
logger = logging.getLogger(__name__)


class ImageEditor(QLabel):
    """图片编辑器，用于显示图片和编辑标注框，支持彩色标签"""
    annotation_updated = Signal(list)

    def __init__(self, parent=None):
        """Create an empty editor with no image, no annotations and no selection.

        Args:
            parent: Optional parent widget, forwarded to the base class.
        """
        super().__init__(parent)

        # --- Image state -------------------------------------------------
        # Source image as handed to set_image() and its Qt counterpart.
        self.image: Optional[Any] = None
        self.q_image: Optional[QImage] = None

        # --- Annotation and class data -----------------------------------
        self.annotations: List[Dict] = list()
        self.class_names: List[str] = list()
        self.class_colors: List[Tuple[int, int, int]] = list()
        # Index into self.annotations of the selected box; -1 means none.
        self.current_box_idx: int = -1

        # --- Mouse interaction state -------------------------------------
        self.dragging: bool = False
        # One of None, 'top_left', 'top_right', 'bottom_left',
        # 'bottom_right' or 'center'.
        self.drag_handle: Optional[str] = None
        self.last_pos = QPoint()
        self.box_offset = QPoint()
        # Set once a drag actually moved something, so that the release
        # handler knows whether to emit annotation_updated.
        self.during_drag_operation: bool = False

        # --- Lookup cache ------------------------------------------------
        # Maps a class name to its colour to avoid repeated list searches.
        self._color_cache: Dict[str, Tuple[int, int, int]] = dict()

        # --- Lifecycle ---------------------------------------------------
        # When True, paintEvent() does nothing (window is closing).
        self.closing: bool = False

        self.init_ui()

    def init_ui(self):
        """Apply the static widget setup: a minimum size and centred content."""
        min_width, min_height = 640, 480
        self.setMinimumSize(min_width, min_height)
        # Fully qualified enum member (Qt.AlignmentFlag.AlignCenter).
        centered = Qt.AlignmentFlag.AlignCenter
        self.setAlignment(centered)

    @property
    def current_annotation(self):
        """Return the selected annotation, or None when the selection index is out of range."""
        selected = self.current_box_idx
        if selected < 0 or selected >= len(self.annotations):
            return None
        return self.annotations[selected]

    @property
    def has_selection(self):
        """Return True when current_box_idx points at an existing annotation."""
        selected = self.current_box_idx
        return selected >= 0 and selected < len(self.annotations)

    @property
    def has_annotations(self):
        """Return True when at least one annotation is loaded."""
        annotation_count = len(self.annotations)
        return annotation_count != 0

    def set_image(self, image):
        """Show a new image and drop the annotations and selection of the previous one.

        Args:
            image: The image to display; passed on to update_q_image(), which
                treats None as "no image". Presumably an OpenCV BGR array
                otherwise - confirm against callers.
        """
        self.image = image
        self.update_q_image()

        # Boxes and the selection index belong to the previous image.
        self.annotations, self.current_box_idx = [], -1

        self.update()

    def update_q_image(self):
        """Convert ``self.image`` (an OpenCV array) to a QImage and refresh the pixmap.

        When ``self.image`` is None, ``self.q_image`` is reset to None and the
        pixmap is left untouched. Otherwise the array is converted to 8-bit
        RGB, wrapped in a QImage, stored in ``self.q_image`` and shown as a
        pixmap scaled to the current widget size (aspect ratio preserved,
        smooth transformation).

        Single-channel (grayscale) arrays are accepted in addition to the
        colour layouts the conversion already handled.
        """
        if self.image is None:
            self.q_image = None
            return

        # A 2-D array, or a 3-D array with one channel, is grayscale; anything
        # else goes through the BGR -> RGB conversion as before.
        is_gray = self.image.ndim == 2 or self.image.shape[2] == 1
        conversion = cv2.COLOR_GRAY2RGB if is_gray else cv2.COLOR_BGR2RGB
        rgb_image = cv2.cvtColor(self.image, conversion)

        height, width = rgb_image.shape[:2]
        # Row stride in bytes, taken from the array itself.
        bytes_per_line = rgb_image.strides[0]

        # A QImage built from an external buffer does not own that memory.
        # rgb_image is a local that dies when this method returns, while
        # self.q_image is reused later (e.g. in resizeEvent), so take a deep
        # copy to give the QImage its own pixel storage.
        self.q_image = QImage(rgb_image.data, width, height, bytes_per_line,
                              QImage.Format.Format_RGB888).copy()

        self.setPixmap(QPixmap.fromImage(self.q_image).scaled(
            self.size(), Qt.AspectRatioMode.KeepAspectRatio, Qt.TransformationMode.SmoothTransformation))

    def set_annotations(self, annotations):
        """Replace the displayed annotations and clear the selection.

        Args:
            annotations: Container of annotations; its ``copy()`` result is
                stored. For a list this is a shallow copy, so the individual
                annotation objects stay shared with the caller.
        """
        copied = annotations.copy()
        self.annotations = copied
        self.current_box_idx = -1
        self.update()

    def set_class_info(self, class_names: List[str], class_colors: List[Tuple[int, int, int]]) -> None:
        """Store the class names with their colours and rebuild the colour cache.

        Args:
            class_names: Label names; a copy is stored.
            class_colors: One colour per label. When the count does not match
                ``class_names``, the colours are replaced by the result of
                ``generate_distinct_colors(len(class_names))``.
        """
        self.class_names = class_names.copy()

        # Only accept the supplied colours when there is exactly one per name.
        counts_match = len(class_colors) == len(class_names)
        self.class_colors = (
            class_colors.copy() if counts_match else generate_distinct_colors(len(class_names))
        )

        # Start the cache afresh from the new name/colour pairs.
        self._color_cache = {
            name: color for name, color in zip(self.class_names, self.class_colors)
        }
        logger.debug(f"已更新标签信息：{len(self.class_names)}个标签")

    # The separate class_color_cache attribute is no longer needed and was removed; _color_cache is used directly.

    def get_class_color(self, class_name: str) -> Tuple[int, int, int]:
        """Return the colour for a class name, falling back to green for unknown names.

        The result is looked up in ``_color_cache`` first. On a miss the
        colour is taken from ``class_colors`` at the position of the name in
        ``class_names``; names that are not listed get ``(0, 255, 0)``. Either
        way the result is stored in the cache before it is returned.
        """
        cache = self._color_cache
        if class_name in cache:
            return cache[class_name]

        if class_name in self.class_names:
            position = self.class_names.index(class_name)
            resolved = self.class_colors[position]
        else:
            # Unknown label: default to green.
            resolved = (0, 255, 0)

        cache[class_name] = resolved
        return resolved

    def paintEvent(self, event):
        """Paint the image, then overlay annotation boxes, labels and selection handles.

        Nothing is painted while ``self.closing`` is set or while
        ``self.q_image`` is None. Otherwise the base class paints first and
        this method draws on top:

        * one rectangle per annotation in its class colour (each channel
          multiplied by 1.2, capped at 255, for the selected box);
        * a filled label above the box with the class name and, when a
          ``"confidence"`` key is present, its value with two decimals;
        * four round handles on the corners of the selected box.

        Box coordinates are mapped from image pixels to widget pixels using
        the pixmap/image size ratio plus the offset of the centred pixmap.
        Errors while drawing a single annotation are logged and skipped so a
        bad entry cannot abort the whole paint pass.
        """
        # Do not paint while the window is closing.
        if self.closing:
            return

        # Nothing to show before an image has been converted.
        if self.q_image is None:
            return

        super().paintEvent(event)

        # Validate everything before creating the painter, so no early return
        # leaves an active QPainter behind.
        pixmap = self.pixmap()
        if pixmap is None or pixmap.isNull():
            return
        if self.image is None:
            return

        # Offset of the pixmap inside the label (it is centred).
        pixmap_x = (self.width() - pixmap.width()) // 2
        pixmap_y = (self.height() - pixmap.height()) // 2

        try:
            scale_x = pixmap.width() / self.image.shape[1]
            scale_y = pixmap.height() / self.image.shape[0]
        except (AttributeError, IndexError, ZeroDivisionError) as e:
            # ZeroDivisionError covers an image with a zero-sized dimension.
            logger.error(f"计算缩放比例时出错: {str(e)}")
            return

        def to_widget(x, y):
            """Map image coordinates to widget coordinates."""
            return x * scale_x + pixmap_x, y * scale_y + pixmap_y

        painter = QPainter(self)
        try:
            painter.setRenderHint(QPainter.RenderHint.Antialiasing)

            # The label font is the same for every annotation: set it once.
            font = QFont()
            font.setBold(True)
            font.setPointSize(10)
            painter.setFont(font)
            font_metrics = painter.fontMetrics()

            # Draw every annotation box in the colour of its class.
            for i, annot in enumerate(self.annotations or ()):
                try:
                    # Skip entries that lack the keys needed for drawing.
                    if not isinstance(annot, dict) or "box" not in annot or "class" not in annot:
                        logger.warning(f"无效的标注数据: {annot}")
                        continue

                    x1, y1, x2, y2 = annot["box"]
                    x1_scaled, y1_scaled = to_widget(x1, y1)
                    x2_scaled, y2_scaled = to_widget(x2, y2)

                    class_name = annot["class"]
                    r, g, b = self.get_class_color(class_name)

                    # The selected box is drawn slightly brighter.
                    if i == self.current_box_idx:
                        r = min(255, int(r * 1.2))
                        g = min(255, int(g * 1.2))
                        b = min(255, int(b * 1.2))

                    color = QColor(r, g, b)
                    painter.setPen(QPen(color, 2))
                    rect = QRect(int(x1_scaled), int(y1_scaled),
                                 int(x2_scaled - x1_scaled), int(y2_scaled - y1_scaled))
                    painter.drawRect(rect)

                    # Label text: class name, plus confidence when available.
                    if "confidence" in annot:
                        text = f"{annot['class']} ({annot['confidence']:.2f})"
                    else:
                        text = annot['class']

                    text_width = font_metrics.horizontalAdvance(text)
                    text_height = font_metrics.height()

                    # Keep the label's top-left corner inside the widget.
                    text_x = max(0, int(x1_scaled))
                    text_y = max(0, int(y1_scaled) - text_height)
                    text_rect = QRect(text_x, text_y, text_width + 4, text_height)
                    painter.fillRect(text_rect, color)

                    # Black text on light backgrounds, white on dark ones.
                    luminance = (r * 0.299 + g * 0.587 + b * 0.114)
                    text_color = QColor(0, 0, 0) if luminance > 127 else QColor(255, 255, 255)
                    painter.setPen(text_color)
                    painter.drawText(text_rect, Qt.AlignmentFlag.AlignCenter, text)
                except Exception as e:
                    # Best effort: a paint handler must not raise, so log the
                    # failing annotation and carry on with the next one.
                    logger.error(f"绘制标注时出错: {str(e)}")
                    continue

            # Draw the corner handles of the selected box, if any.
            try:
                if 0 <= self.current_box_idx < len(self.annotations):
                    annot = self.annotations[self.current_box_idx]
                    if isinstance(annot, dict) and "box" in annot:
                        x1, y1, x2, y2 = annot["box"]
                        x1_scaled, y1_scaled = to_widget(x1, y1)
                        x2_scaled, y2_scaled = to_widget(x2, y2)

                        control_size = 8
                        points = [
                            (x1_scaled, y1_scaled),  # top-left
                            (x2_scaled, y1_scaled),  # top-right
                            (x1_scaled, y2_scaled),  # bottom-left
                            (x2_scaled, y2_scaled)  # bottom-right
                        ]

                        # Yellow outline, white fill.
                        painter.setPen(QPen(QColor(255, 255, 0), 2))
                        painter.setBrush(QColor(255, 255, 255))
                        for (x, y) in points:
                            try:
                                painter.drawEllipse(int(x - control_size / 2), int(y - control_size / 2),
                                                    control_size, control_size)
                            except Exception:
                                logger.warning(f"绘制控制点失败: ({x}, {y})")
            except Exception as e:
                logger.error(f"绘制控制点时出错: {str(e)}")
        finally:
            # Release the paint device explicitly instead of relying on
            # garbage collection of the painter object.
            if painter.isActive():
                painter.end()

    def mousePressEvent(self, event):
        """Select the annotation under the cursor and start dragging it.

        Annotations are tested in list order. For each one, the four corners
        are checked first (a press within 10 widget pixels of a corner grabs
        that corner handle), then the box interior (grabs the whole box as
        ``'center'``). The first hit wins and the event is consumed.

        A press that hits nothing clears the selection, repaints if a box was
        selected before, and forwards the event to the base class. When there
        is no image or no annotation the event is forwarded unchanged.
        """
        if self.q_image is None or self.image is None or not self.annotations:
            return super().mousePressEvent(event)

        pos = event.pos()
        pixmap = self.pixmap()
        if pixmap is None or pixmap.isNull():
            return None

        # Offset of the centred pixmap inside the label.
        pixmap_x = (self.width() - pixmap.width()) // 2
        pixmap_y = (self.height() - pixmap.height()) // 2

        # Image-to-widget scale factors.
        scale_x = pixmap.width() / self.image.shape[1]
        scale_y = pixmap.height() / self.image.shape[0]

        # Remember the old selection so a deselect can trigger a repaint.
        previous_idx = self.current_box_idx
        self.current_box_idx = -1
        self.drag_handle = None

        # Pick radius around a corner, in widget pixels.
        control_size = 10

        hit_idx = -1
        hit_handle = None
        hit_offset = None

        for i, annot in enumerate(self.annotations):
            # Skip malformed entries, as the paint code does.
            if not isinstance(annot, dict) or "box" not in annot:
                continue

            x1, y1, x2, y2 = annot["box"]
            x1_scaled = x1 * scale_x + pixmap_x
            y1_scaled = y1 * scale_y + pixmap_y
            x2_scaled = x2 * scale_x + pixmap_x
            y2_scaled = y2 * scale_y + pixmap_y

            handles = [
                (x1_scaled, y1_scaled, 'top_left'),
                (x2_scaled, y1_scaled, 'top_right'),
                (x1_scaled, y2_scaled, 'bottom_left'),
                (x2_scaled, y2_scaled, 'bottom_right')
            ]

            # Corner handles take precedence over the interior of the same box.
            corner = next(
                (name for hx, hy, name in handles
                 if abs(pos.x() - hx) <= control_size and abs(pos.y() - hy) <= control_size),
                None,
            )
            if corner is not None:
                hit_idx, hit_handle = i, corner
                break

            if (x1_scaled <= pos.x() <= x2_scaled and
                    y1_scaled <= pos.y() <= y2_scaled):
                hit_idx, hit_handle = i, 'center'
                # Cursor position relative to the box's top-left corner.
                hit_offset = QPoint(
                    int(pos.x() - x1_scaled),
                    int(pos.y() - y1_scaled)
                )
                break

        if hit_idx >= 0:
            self.current_box_idx = hit_idx
            self.drag_handle = hit_handle
            self.last_pos = pos
            if hit_offset is not None:
                self.box_offset = hit_offset
            self.dragging = True
            self.update()
            return None

        # Nothing was hit. If that cleared an existing selection, repaint so
        # the highlight and handles of the old box disappear.
        if previous_idx != -1:
            self.update()

        super().mousePressEvent(event)
        return None

    def mouseMoveEvent(self, event):
        """Move or resize the selected annotation while the mouse is dragged.

        With the ``'center'`` handle the whole box follows the cursor; the
        displacement is limited so the box stops at the image border without
        changing size. With a corner handle that corner follows the cursor
        while the opposite corner stays fixed; when the cursor crosses the
        fixed corner the active handle is flipped so the anchor is kept.

        The resulting box is clamped to the image, normalised so that
        ``x1 < x2`` and ``y1 < y2``, and stored as a tuple under ``"box"``.
        Only a repaint is requested here; ``annotation_updated`` is emitted
        on mouse release.
        """
        if not self.dragging or self.current_box_idx < 0 or self.current_box_idx >= len(self.annotations):
            return super().mouseMoveEvent(event)

        pos = event.pos()
        pixmap = self.pixmap()
        if pixmap is None or pixmap.isNull():
            return None

        # Offset of the centred pixmap inside the label.
        pixmap_x = (self.width() - pixmap.width()) // 2
        pixmap_y = (self.height() - pixmap.height()) // 2

        img_width = self.image.shape[1]
        img_height = self.image.shape[0]

        # Widget-to-image scale factors.
        inv_scale_x = img_width / pixmap.width()
        inv_scale_y = img_height / pixmap.height()

        x1, y1, x2, y2 = self.annotations[self.current_box_idx]["box"]
        new_x1, new_y1, new_x2, new_y2 = x1, y1, x2, y2  # default: unchanged

        handle = self.drag_handle
        # Which edges a corner handle controls; both stay None for 'center'.
        vertical = horizontal = None

        if handle == 'center':
            dx = (pos.x() - self.last_pos.x()) * inv_scale_x
            dy = (pos.y() - self.last_pos.y()) * inv_scale_y

            # Limit the displacement instead of clamping each corner, so the
            # box keeps its size when pushed against an image border.
            dx = max(-x1, min(dx, img_width - x2))
            dy = max(-y1, min(dy, img_height - y2))

            new_x1, new_x2 = x1 + dx, x2 + dx
            new_y1, new_y2 = y1 + dy, y2 + dy

        elif handle in ('top_left', 'top_right', 'bottom_left', 'bottom_right'):
            vertical, horizontal = handle.split('_')

            # Cursor position in image coordinates.
            cursor_x = (pos.x() - pixmap_x) * inv_scale_x
            cursor_y = (pos.y() - pixmap_y) * inv_scale_y

            if horizontal == 'left':
                new_x1 = cursor_x
            else:
                new_x2 = cursor_x
            if vertical == 'top':
                new_y1 = cursor_y
            else:
                new_y2 = cursor_y

        # Keep all coordinates inside the image.
        new_x1 = max(0, min(new_x1, img_width))
        new_y1 = max(0, min(new_y1, img_height))
        new_x2 = max(0, min(new_x2, img_width))
        new_y2 = max(0, min(new_y2, img_height))

        # Normalise so (x1, y1) is the top-left corner. If a corner drag
        # crossed the opposite edge, the dragged corner changed sides, so the
        # handle name has to change with it.
        if new_x1 > new_x2:
            new_x1, new_x2 = new_x2, new_x1
            if horizontal is not None:
                horizontal = 'right' if horizontal == 'left' else 'left'
        if new_y1 > new_y2:
            new_y1, new_y2 = new_y2, new_y1
            if vertical is not None:
                vertical = 'bottom' if vertical == 'top' else 'top'
        if vertical is not None:
            self.drag_handle = f"{vertical}_{horizontal}"

        # Avoid zero-width/height boxes; widen by one pixel towards the side
        # that keeps the box at non-negative coordinates.
        if new_x1 == new_x2:
            if new_x1 >= 1:
                new_x1 -= 1
            else:
                new_x2 += 1
        if new_y1 == new_y2:
            if new_y1 >= 1:
                new_y1 -= 1
            else:
                new_y2 += 1

        self.annotations[self.current_box_idx]["box"] = (new_x1, new_y1, new_x2, new_y2)
        self.last_pos = pos

        # Remember that a drag changed something; the release handler emits
        # the update signal based on this flag.
        self.during_drag_operation = True

        # Repaint only; no signal while the drag is in progress.
        self.update()
        return None

    def update_annotation_area(self, old_x1, old_y1, old_x2, old_y2, new_x1, new_y1, new_x2, new_y2, scale_x, scale_y, pixmap_x, pixmap_y):
        """Request a repaint of just the region covering a box before and after a change.

        The old and new boxes are given in image coordinates and mapped to
        widget coordinates with ``scale_*`` and ``pixmap_*``. The repainted
        rectangle spans both boxes plus a 10 pixel margin on every side.
        """
        margin = 10

        def widget_x(value):
            return value * scale_x + pixmap_x

        def widget_y(value):
            return value * scale_y + pixmap_y

        # Bounding region of the two boxes, grown by the margin.
        left = int(min(widget_x(old_x1), widget_x(new_x1)) - margin)
        top = int(min(widget_y(old_y1), widget_y(new_y1)) - margin)
        right = int(max(widget_x(old_x2), widget_x(new_x2)) + margin)
        bottom = int(max(widget_y(old_y2), widget_y(new_y2)) + margin)

        self.update(left, top, right - left, bottom - top)

    def mouseReleaseEvent(self, event):
        """Finish a drag and, if it changed anything, emit ``annotation_updated``."""
        self.dragging = False

        drag_changed_something = self.during_drag_operation
        if drag_changed_something:
            # Reset the flag first, then notify listeners once per drag.
            self.during_drag_operation = False
            self.annotation_updated.emit(self.annotations)

        super().mouseReleaseEvent(event)

    def resizeEvent(self, event):
        """Rescale the displayed pixmap to the new widget size and repaint."""
        if self.q_image:
            full_size = QPixmap.fromImage(self.q_image)
            fitted = full_size.scaled(
                self.size(),
                Qt.AspectRatioMode.KeepAspectRatio,
                Qt.TransformationMode.SmoothTransformation,
            )
            self.setPixmap(fitted)

        super().resizeEvent(event)

        # Repaint so the annotation overlay matches the rescaled image.
        self.update()

    def contextMenuEvent(self, event):
        """Show a context menu for the selected annotation (change label / delete).

        Without a valid selection the event is passed to the base class.
        """
        selected = self.current_box_idx
        if not (0 <= selected < len(self.annotations)):
            return super().contextMenuEvent(event)

        menu = QMenu(self)
        modify_action = menu.addAction("修改标签")
        delete_action = menu.addAction("删除此标注")

        # Open the menu at the cursor and wait for the user's choice.
        chosen = menu.exec(self.mapToGlobal(event.pos()))

        dispatch = (
            (modify_action, self.modify_annotation_label),
            (delete_action, self.delete_annotation),
        )
        for candidate, handler in dispatch:
            if chosen == candidate:
                handler()
                break
        return None

    def modify_annotation_label(self):
        """Let the user pick a new class for the selected annotation.

        Shows a warning and returns when no class names are configured. Does
        nothing when no annotation is selected. Otherwise a non-editable
        selection dialog is opened, pre-selecting the annotation's current
        class when it is in ``class_names`` (the first entry otherwise). On
        confirmation the annotation's ``"class"`` and ``"class_id"`` are
        updated, the widget is repainted and ``annotation_updated`` is
        emitted.
        """
        if not self.class_names:
            QMessageBox.warning(self, "警告", "没有可用的标签，请先在项目设置中添加标签")
            return

        # Without this guard an index of -1 ("nothing selected") would
        # silently address the LAST annotation through negative indexing.
        if not (0 <= self.current_box_idx < len(self.annotations)):
            return

        annotation = self.annotations[self.current_box_idx]
        current_label = annotation.get("class")
        initial_index = self.class_names.index(current_label) if current_label in self.class_names else 0

        # Choose from the project's label list; free text is not allowed.
        label, ok = QInputDialog.getItem(
            self, "修改标签", "请选择标签:",
            self.class_names, initial_index,
            False)

        if ok and label:
            annotation["class"] = label
            # Keep the numeric class id in sync with the name.
            if label in self.class_names:
                annotation["class_id"] = self.class_names.index(label)
            self.update()
            self.annotation_updated.emit(self.annotations)

    def delete_annotation(self):
        """Delete the selected annotation, clear the selection and notify listeners.

        Does nothing when no annotation is selected.
        """
        # Without this guard an index of -1 ("nothing selected") would delete
        # the LAST annotation, and an empty list would raise IndexError.
        if not (0 <= self.current_box_idx < len(self.annotations)):
            return

        del self.annotations[self.current_box_idx]
        self.current_box_idx = -1
        self.update()
        self.annotation_updated.emit(self.annotations)