优化

be610aa6 · zhengyaoqiu · 324f97a4 · be610aa6 · be610aa6 · be610aa6
Commit be610aa6 authored May 30, 2025 by zhengyaoqiu
Hide whitespace changes
Inline Side-by-side

Showing with 13 additions and 10 deletions

feature_extractor.py app/services/feature_extractor.py +7 -5

image_upload.py app/services/image_upload.py +4 -4

test_milvus.py tests/test_milvus.py +2 -1

No files found.
--- a/app/services/feature_extractor.py
+++ b/app/services/feature_extractor.py
@@ -10,19 +10,19 @@ class FeatureExtractor:
    __logger = logging.getLogger(__name__)

    device = "cuda" if torch.cuda.is_available() else "cpu"
-    def __init__(self, device = "xpu" if torch.xpu.is_available() else "cpu", model_name = "ViT-B/32"):
+    def __init__(self, device = "xpu" if torch.xpu.is_available() else "cpu", model_name = "ViT-L/14@336px"):
        device = "cpu"
        self.model, self.preprocess = self.init_model(device, model_name)
        self.device = device

    @staticmethod
-    def init_model(device="xpu" if torch.xpu.is_available() else "cpu", model_name="ViT-B/32"):
+    def init_model(device="xpu" if torch.xpu.is_available() else "cpu", model_name="ViT-L/14@336px"):
        print(f"创建并初始化 CLIP 模型: {model_name} 在设备: {device}")
        model, preprocess = clip.load(model_name, device=device)
        return model, preprocess

    @staticmethod
-    def resize_with_padding(img, target_size = (224, 224)):
+    def resize_with_padding(img, target_size = (336, 336)):
        """
        调整图像大小，保持纵横比并添加填充

@@ -97,7 +97,7 @@ class FeatureExtractor:

        # device = "xpu" if torch.xpu.is_available() else "cpu"
        # device = "cpu"
-        # model_name = "ViT-B/32"
+        # model_name = "ViT-L/14@336px"
        # model, preprocess = self.init_model(device, model_name)

        try:
@@ -113,7 +113,9 @@ class FeatureExtractor:
                # 归一化特征向量
                image_features /= image_features.norm(dim=-1, keepdim=True)

-            return image_features.cpu().numpy().astype(np.float32).flatten()
+                result = image_features.cpu().numpy().astype(np.float32).flatten()
+                # ViT-L/14@336px 需要转换列表结构
+                return result.tolist()

        except Exception as e:
            self.__logger.error(f"Error extracting features from image: {e}")

--- a/app/services/image_upload.py
+++ b/app/services/image_upload.py
@@ -13,12 +13,12 @@ class ImageUpload:
    def upload_many(self, bucket, image2keys):
        keys = []
        vectors = []
-
-        images = [image2key["image"] for image2key in image2keys]
-        new_images, exist_images = self.milvus.filter_new_urls(bucket, images)
        images = []

-        print(f"总图片数: {len(images)}")
+        all_images = [image2key["image"] for image2key in image2keys]
+        new_images, exist_images = self.milvus.filter_new_urls(bucket, all_images)
+
+        print(f"总图片数: {len(all_images)}")
        print(f"新图片数: {len(new_images)}")
        print(f"已存在图片数: {len(exist_images)}")
        print(f"新图片: {new_images}")

--- a/tests/test_milvus.py
+++ b/tests/test_milvus.py
@@ -11,7 +11,8 @@ class TestCreateCollectionFunction(unittest.TestCase):
        fields: List[FieldSchema] = [
            FieldSchema(name="image", dtype=DataType.VARCHAR, max_length=256, is_primary=True, auto_id=False),
            FieldSchema(name="key", dtype=DataType.VARCHAR, max_length=256),
-            FieldSchema(name="vector", dtype=DataType.FLOAT_VECTOR, dim=512)  # CLIP ViT-B/32的特征维度为512
+            # FieldSchema(name="vector", dtype=DataType.FLOAT_VECTOR, dim=512)  # CLIP ViT-B/32的特征维度为512
+            FieldSchema(name="vector", dtype=DataType.FLOAT_VECTOR, dim=768)  # CLIP ViT-L/14@336px的特征维度为768
        ]
        MilvusClient().connect().create_collection("pc3", fields, "PC3 图片向量存储")