main
HuangHai 4 weeks ago
parent 83f0f949f1
commit e42609c5f6

@ -21,3 +21,8 @@ MODEL_NAME = "qwen-plus"
# Jieba分词自定义词典配置
JIEBA_CUSTOM_WORDS = ['文言虚词', '花呗']
# 腾讯 AI Lab 中文词向量模型的路径
MODEL_PATH = "D:/Tencent_AILab_ChineseEmbedding/Tencent_AILab_ChineseEmbedding.txt"
# 加载词向量模型时限制的词汇数量
MODEL_LIMIT = 10000

@ -1 +1 @@
http://localhost:8000/static/index.html
http://10.10.21.22:8000/static/index.html

@ -2,10 +2,9 @@ import logging
import os
from logging.handlers import RotatingFileHandler
import jieba
from elasticsearch import Elasticsearch
from gensim.models import KeyedVectors
from Config.Config import MS_MODEL_PATH, MS_MODEL_LIMIT
from Config.Config import MODEL_LIMIT, MODEL_PATH
from ElasticSearch.Utils.ElasticsearchConnectionPool import ElasticsearchConnectionPool
# 初始化日志
@ -49,7 +48,7 @@ class EsSearchUtil:
# 加载预训练模型
self.model = KeyedVectors.load_word2vec_format(MS_MODEL_PATH, binary=False, limit=MS_MODEL_LIMIT)
self.model = KeyedVectors.load_word2vec_format(MODEL_PATH, binary=False, limit=MODEL_LIMIT)
logger.info(f"模型加载成功,词向量维度: {self.model.vector_size}")
# 初始化Elasticsearch连接

Loading…
Cancel
Save