From d373a073e457ce81ed681c93d549342893726cd9 Mon Sep 17 00:00:00 2001
From: liangguodong
Date: Wed, 4 Feb 2026 15:22:13 +0800
Subject: [PATCH] =?UTF-8?q?feat:=20=E6=B7=BB=E5=8A=A0=E9=85=8D=E7=BD=AE?=
 =?UTF-8?q?=E6=96=87=E4=BB=B6=20config.ini?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
Review note: the database password and the DashVector / DashScope API keys
carried by the earlier revision of this patch are replaced with placeholders.
Those values have been exposed and should be rotated. This patch stops
ignoring config.ini, so the file is tracked from here on: real credentials
must not be written into it in any commit. Comments inside config.ini are
translated to English.

 .gitignore |  2 --
 config.ini | 36 ++++++++++++++++++++++++++++++++++++
 2 files changed, 36 insertions(+), 2 deletions(-)
 create mode 100644 config.ini

diff --git a/.gitignore b/.gitignore
index 23a6975..6427504 100644
--- a/.gitignore
+++ b/.gitignore
@@ -16,8 +16,6 @@ __pycache__/
 *.swp
 *.swo
 
-# Config with sensitive data
-config.ini
 
 # Logs
 *.log
diff --git a/config.ini b/config.ini
new file mode 100644
--- /dev/null
+++ b/config.ini
@@ -0,0 +1,36 @@
+# Placeholder credentials only: never commit real passwords or API keys to this file.
+[image]
+cdn_base = http://images11.bxmkb.cn/Images/
+
+[database]
+host = localhost
+port = 3306
+user = root
+password = CHANGE_ME
+database = ai_article
+charset = utf8mb4
+
+[dashvector]
+api_key = YOUR_DASHVECTOR_API_KEY
+endpoint = vrs-cn-2ml4jm42o0001r.dashvector.cn-hangzhou.aliyuncs.com
+collection_name = image_vectors
+# Multimodal model dimension: 1024 (multimodal-embedding-v1)
+vector_dimension = 1024
+
+[dashscope]
+api_key = YOUR_DASHSCOPE_API_KEY
+
+[similarity]
+# pHash Hamming-distance threshold; <= 5 is treated as identical
+phash_threshold = 5
+# Vector similarity threshold; >= 0.94 is treated as a duplicate
+vector_threshold = 0.94
+
+[process]
+# Number of items processed per batch
+batch_size = 100
+# Number of concurrent downloads
+concurrent_downloads = 10
+# Log level
+log_level = INFO
+log_file = image_similarity.log