Local sentiment analysis upload.
This commit is contained in:
@@ -0,0 +1,53 @@
|
||||
# -*- coding: utf-8 -*-
|
||||
"""
Qwen3 model configuration file.

Defines the model parameters and settings for the different model sizes.
"""
|
||||
|
||||
# Qwen3 model configuration.
#
# Maps a model-size label ("0.6B", "4B", "8B") to the settings used for that
# size. Every entry carries the same keys:
#   base_model / embedding_model  - model identifiers
#                                   (NOTE(review): these look like Hugging Face
#                                   Hub repo ids - confirm against the loader)
#   embedding_dim                 - embedding vector width
#   max_length                    - maximum sequence length
#   recommended_batch_size        - suggested batch size
#   recommended_lr                - suggested learning rate
#   lora_r / lora_alpha           - LoRA rank and alpha; alpha is 2 * r in
#                                   every entry below
QWEN3_MODELS = {
    "0.6B": {
        "base_model": "Qwen/Qwen3-0.6B",
        "embedding_model": "Qwen/Qwen3-Embedding-0.6B",
        "embedding_dim": 1024,
        "max_length": 32768,
        "recommended_batch_size": 32,
        "recommended_lr": 1e-3,
        "lora_r": 16,
        "lora_alpha": 32,
    },
    "4B": {
        "base_model": "Qwen/Qwen3-4B",
        "embedding_model": "Qwen/Qwen3-Embedding-4B",
        "embedding_dim": 2560,
        "max_length": 32768,
        "recommended_batch_size": 16,
        "recommended_lr": 5e-4,
        "lora_r": 32,
        "lora_alpha": 64,
    },
    "8B": {
        "base_model": "Qwen/Qwen3-8B",
        "embedding_model": "Qwen/Qwen3-Embedding-8B",
        "embedding_dim": 4096,
        "max_length": 32768,
        "recommended_batch_size": 8,
        "recommended_lr": 2e-4,
        "lora_r": 64,
        "lora_alpha": 128,
    },
}
|
||||
|
||||
# Model file path configuration.
#
# Maps an approach ("embedding" or "lora") and then a model-size label to the
# location of the corresponding saved artifact. The size labels are the same
# ones used as keys of QWEN3_MODELS.
# NOTE(review): the paths are relative ("./models/..."), so they presumably
# resolve against the process working directory - confirm in the caller.
MODEL_PATHS = {
    "embedding": {
        "0.6B": "./models/qwen3_embedding_0.6b_sentiment.pth",
        "4B": "./models/qwen3_embedding_4b_sentiment.pth",
        "8B": "./models/qwen3_embedding_8b_sentiment.pth",
    },
    "lora": {
        "0.6B": "./models/qwen3_lora_0.6b_final",
        "4B": "./models/qwen3_lora_4b_final",
        "8B": "./models/qwen3_lora_8b_final",
    },
}
|
||||
Reference in New Issue
Block a user