first commit

2024-12-12 17:05:39 +08:00 · 2024-12-12 17:05:39 +08:00 · 1dadf70601
commit 1dadf70601
10 changed files with 343 additions and 0 deletions
--- a/.gitignore
+++ b/.gitignore
@ -0,0 +1,16 @@
+*.log
+*.log.*
+*.bak
+logs
+**/target
+.idea/
+*.class
+*.manifest
+*.spec
+.DS_Store
+
+
+
+
+
+
--- a/dataset/1014072304_0724045231.jpg
+++ b/dataset/1014072304_0724045231.jpg
--- a/dataset/1024072305_0724123756.jpg
+++ b/dataset/1024072305_0724123756.jpg
--- a/dataset/1024072305_0724123822.jpg
+++ b/dataset/1024072305_0724123822.jpg
--- a/dataset/1024072305_0724123933.jpg
+++ b/dataset/1024072305_0724123933.jpg
--- a/model/sishu_middle_24_12.onnx
+++ b/model/sishu_middle_24_12.onnx
--- a/model/sishu_thin_24_12.onnx
+++ b/model/sishu_thin_24_12.onnx
--- a/readme.md
+++ b/readme.md
@ -0,0 +1,28 @@
+## 简介
+本项目主要用于实现智能标注，支持本地标注的测试和web标注的服务提供。
+## model 
+model 目录用于存放训练好的模型，以及模型对应的配置文件。
+
+## dataset
+dataset 目录用于存放测试数据集。
+
+## output
+output 目录用于存放含有标注结果的图片。
+
+## logs
+logs 目录用于存放标注过程中产生的日志文件。每个日志文件最大10MB，最多保留5个文件。
+
+## 文件说明
+sishu_label_local.py 为本地标注的测试代码，目的是将dataset里的丝束的图片进行标注，并将标注结果包括标签和矩形框保存到output目录下。
+sishu_label_web.py 为web标注的服务提供代码，目的是根据传入的网络图像路径按照传入的标签进行标注，返回标注结果。
+
+
+## 启动sishu_label_local的方法
+python sishu_label_local.py
+
+## 启动sishu_label_web的方法
+单进程启动：
+uvicorn sishu_label_web:app --reload --host '0.0.0.0' --port 8081
+
+多进程启动：
+uvicorn sishu_label_web:app --host 0.0.0.0 --port 8081 --workers 5 
--- a/sishu_label_local.py
+++ b/sishu_label_local.py
@ -0,0 +1,130 @@
+import os
+from ultralytics import YOLO
+import cv2
+import random
+
+def generate_label_colors(labels):
+    """为每个标签生成固定颜色（红色，黄色，蓝色，绿色）"""
+    colors = {
+        "red": (255, 0, 0),
+        "yellow": (255, 255, 0),
+        "blue": (0, 0, 255),
+        "green": (0, 255, 0),
+    }
+    # 为标签分配颜色，确保颜色在红、黄、蓝、绿之间循环
+    label_colors = {}
+    color_list = list(colors.values())
+    for i, label in enumerate(labels):
+        print(f"generate_label_colors, label: {label}")
+        label_colors[label] = color_list[i % len(color_list)]  # 循环分配颜色
+
+    return label_colors
+
+def intelligent_annotation_with_filter(model_path, input_folder, output_folder, target_labels, conf_threshold=0.3):
+    """
+    使用 YOLOv8 模型对本地文件夹图像进行智能标注，并按指定标签过滤输出。
+
+    :param model_path: YOLOv8 模型文件路径
+    :param input_folder: 输入文件夹路径，包含待标注的图像
+    :param output_folder: 输出文件夹路径，存储标注后的图像
+    :param target_labels: 用户指定需要标注的目标类别列表
+    :param conf_threshold: 置信度阈值，默认 0.5
+    """
+    # 加载 YOLO 模型
+    model = YOLO(model_path)
+
+    # 获取所有可能的标签
+    all_labels = model.names.values()
+    print("所有可能的标签：", all_labels)
+    label_colors = generate_label_colors(all_labels)
+    print("所有可能的标签对应的颜色：", label_colors)
+
+    # 保存标注结果的字典
+    annotation_results = {}
+
+    # 创建输出文件夹（如果不存在）
+    os.makedirs(output_folder, exist_ok=True)
+
+    # 遍历输入文件夹中的所有图像
+    for file_name in os.listdir(input_folder):
+        input_path = os.path.join(input_folder, file_name)
+
+        # 检查文件是否是图像格式
+        if not (file_name.endswith('.jpg') or file_name.endswith('.png') or file_name.endswith('.jpeg')):
+            continue
+
+        # 模型预测
+        results = model(input_path, task="detect", conf=conf_threshold)
+
+        image_annotations = []  # 当前图像的标注信息
+
+        # 读取原始图像
+        image = cv2.imread(input_path)
+
+        # 获取图像尺寸
+        image_height, image_width = image.shape[:2]
+
+        # 标注的标志，检查是否有符合的目标
+        has_annotation = False
+
+        # 遍历预测结果
+        for result in results:
+            for box in result.boxes:
+                # 提取边界框信息和分类标签
+                x1, y1, x2, y2 = map(int, box.xyxy[0])  # 坐标转换为整数
+                label = model.names[int(box.cls[0])]    # 类别名称
+                print(f"label:" + label)
+                conf = box.conf[0]                     # 置信度
+
+                # 检查是否为目标标签
+                if label in target_labels:
+                    color = label_colors[label]  # 获取对应标签的颜色
+                    has_annotation = True
+
+                    # 绘制边界框
+                    # color = (0, 255, 0)  # 绿色
+                    # 随机生成颜色
+                    # color = tuple(random.randint(0, 255) for _ in range(3))  # 生成随机颜色
+                    cv2.rectangle(image, (x1, y1), (x2, y2), color, 2)
+
+                    # 在边界框上方绘制标签和置信度
+                    label_text = f"{label} {conf:.2f}"
+                    print(f"label_text:" + label_text)
+                    cv2.putText(image, label_text, (x1, y1 - 10), cv2.FONT_HERSHEY_SIMPLEX, 2, color, 1)
+
+                    # 转换为归一化坐标并保存
+                    normalized_x = x1 / image_width
+                    normalized_y = y1 / image_height
+                    normalized_width = (x2 - x1) / image_width
+                    normalized_height = (y2 - y1) / image_height
+
+                    annotation = {
+                        "label": label,
+                        "x": normalized_x * 100,
+                        "y": normalized_y * 100,
+                        "width": normalized_width * 100,
+                        "height": normalized_height * 100,
+                    }
+                    image_annotations.append(annotation)
+
+                # 保存标注信息到结果字典
+        annotation_results[input_path] = image_annotations if image_annotations else []
+
+        # 如果存在符合的标注目标，保存标注后的图像
+        if has_annotation:
+            output_path = os.path.join(output_folder, file_name)
+            cv2.imwrite(output_path, image)
+
+    print(f"智能标注完成！标注后的图像保存在：{output_folder}")
+    return annotation_results
+
+model_path = "./model/sishu_thin_24_12.onnx"  # 你的YOLOv8模型权重路径
+input_folder = "./dataset"  # 输入文件夹路径
+output_folder = "./output"  # 输出文件夹路径
+target_labels = ["tiaojuan", "zhujiesi", "yulinwen"]  # 用户指定的目标标签
+annotation_results = intelligent_annotation_with_filter(model_path, input_folder, output_folder, target_labels)
+print(f"标注结果：annotation_results：{annotation_results}")
+
+print(f"标注结果：./dataset/1024072305_0724123933.jpg annotation_results：{annotation_results['./dataset/1024072305_0724123933.jpg']}")
+
+
--- a/sishu_label_web.py
+++ b/sishu_label_web.py
@ -0,0 +1,169 @@
+from fastapi import FastAPI, HTTPException
+from pydantic import BaseModel
+from typing import List, Optional
+import cv2
+from ultralytics import YOLO
+import requests
+import numpy as np
+import time
+from contextlib import asynccontextmanager
+import logging
+import os
+from logging.handlers import RotatingFileHandler
+from urllib.parse import urlparse
+
+# 设置日志配置
+log_dir = "logs"
+os.makedirs(log_dir, exist_ok=True)
+
+# 配置日志
+log_file = os.path.join(log_dir, "app.log")
+logger = logging.getLogger("Sishu_AI_Annotation")
+logger.setLevel(logging.DEBUG)
+
+# 设置文件回滚，每个日志文件最大10MB，最多保留5个文件
+handler = RotatingFileHandler(log_file, maxBytes=10 * 1024 * 1024, backupCount=5)
+formatter = logging.Formatter('%(asctime)s - %(name)s - %(levelname)s - %(message)s')
+handler.setFormatter(formatter)
+logger.addHandler(handler)
+
+@asynccontextmanager
+async def app_lifespan(app: FastAPI):
+    """定义应用的生命周期事件"""
+    global model
+    logger.info("正在加载模型...")
+    model = YOLO("./model/sishu_thin_24_12.onnx")  # 加载YOLO模型
+    logger.info("模型加载完成")
+    yield  # 生命周期的运行阶段
+    # 在这里可以执行任何必要的清理操作
+
+# FastAPI应用
+app = FastAPI(lifespan=app_lifespan)
+
+# Request body schema for the /annotate endpoint
+class AnnotateRequest(BaseModel):
+    image_urls: List[str]  # images to annotate; entries starting with "http" are downloaded, others are read as local paths
+    target_labels: Optional[List[str]] = None  # labels to keep; None keeps every detected label
+    conf_threshold: Optional[float] = 0.3 # confidence threshold passed to the model
+
+# 为每个标签生成固定颜色（红色，黄色，蓝色，绿色）
+def generate_label_colors(labels):
+    colors = {
+        "red": (255, 0, 0),
+        "yellow": (255, 255, 0),
+        "blue": (0, 0, 255),
+        "green": (0, 255, 0),
+    }
+    label_colors = {}
+    color_list = list(colors.values())
+    for i, label in enumerate(labels):
+        label_colors[label] = color_list[i % len(color_list)]  # 循环分配颜色
+
+    return label_colors
+
+
+# 通过URL加载图像
+def load_image_from_url(image_url):
+    try:
+        response = requests.get(image_url)
+        response.raise_for_status()
+        image_array = np.frombuffer(response.content, np.uint8)
+        image = cv2.imdecode(image_array, cv2.IMREAD_COLOR)
+
+        if image is None:
+            logger.error(f"无法解码图像：{image_url}")
+            return None
+
+        return image
+    except requests.exceptions.RequestException as e:
+        logger.error(f"请求失败: {e}")
+        return None
+
+
+# 对图像进行智能标注
+def annotate_images(model, image_urls, target_labels=None, conf_threshold=0.1):
+    annotation_results = {}
+    all_labels = model.names.values()
+    label_colors = generate_label_colors(all_labels)
+
+    for image_url in image_urls:
+        # 假设 image_path 可能是一个 URL 或者本地路径
+        if image_url.startswith("http"):
+            # 如果是URL，加载在线图片
+            start_time = time.time()  # 记录开始时间
+            image = load_image_from_url(image_url)
+            end_time = time.time()  # 记录结束时间
+            load_time = end_time - start_time
+            logger.debug(f"加载图像 {image_url} 的时间: {load_time:.3f} 秒")
+        else:
+            # 如果是本地路径，使用cv2读取
+            image = cv2.imread(image_url)
+
+        if image is None:
+            logger.error(f"无法读取图像：{image_url}")
+            continue
+
+        image_height, image_width = image.shape[:2]
+        results = model(image, task="detect", conf=conf_threshold)
+
+        image_annotations = []
+
+        path = urlparse(image_url).path
+        file_name = os.path.basename(path)
+
+        for result in results:
+            for box in result.boxes:
+                x1, y1, x2, y2 = map(int, box.xyxy[0])
+                label = model.names[int(box.cls[0])]
+                conf = box.conf[0]
+
+                if target_labels is None or label in target_labels:
+                    color = label_colors[label]
+
+                    cv2.rectangle(image, (x1, y1), (x2, y2), color, 2)
+                    label_text = f"{label} {conf:.2f}"
+                    cv2.putText(image, label_text, (x1, y1 - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.6, color, 2)
+
+                    normalized_x = x1 / image_width
+                    normalized_y = y1 / image_height
+                    normalized_width = (x2 - x1) / image_width
+                    normalized_height = (y2 - y1) / image_height
+
+                    annotation = {
+                        "label": label,
+                        "x": normalized_x * 100,
+                        "y": normalized_y * 100,
+                        "width": normalized_width * 100,
+                        "height": normalized_height * 100,
+                    }
+                    image_annotations.append(annotation)
+
+        annotation_results[image_url] = image_annotations if image_annotations else []                    # 保存标注后的图像
+        output_path = os.path.join("./output", os.path.basename(image_url))
+        cv2.imwrite(output_path, image)
+        logger.info("图片路径：{}".format(output_path))
+
+
+    return annotation_results
+
+# FastAPI端点 - 图像标注接口
+@app.post("/annotate")
+async def annotate(request: AnnotateRequest):
+    try:
+        logger.info("开始处理请求: %s", request.dict())
+        annotation_results = annotate_images(
+            model=model,
+            image_urls=request.image_urls,
+            target_labels=request.target_labels,
+            conf_threshold=request.conf_threshold
+        )
+        logger.info("请求处理完成")
+        logger.info("annotations:{}", annotation_results)
+        return {"annotations": annotation_results}
+
+    except Exception as e:
+        logger.error(f"发生错误: {e}")
+        raise HTTPException(status_code=500, detail=str(e))
+
+
+# 示例用法: 调用接口时会返回JSON格式的标注结果，包含图片的路径和标注信息。