Files
bettafish-company/WeiboSentiment_SmallQwen/models_config.py
T

53 lines
1.4 KiB
Python

# -*- coding: utf-8 -*-
"""
Qwen3模型配置文件
定义不同规模的模型参数和配置
"""
# Qwen3模型配置
QWEN3_MODELS = {
"0.6B": {
"base_model": "Qwen/Qwen3-0.6B",
"embedding_model": "Qwen/Qwen3-Embedding-0.6B",
"embedding_dim": 1024,
"max_length": 32768,
"recommended_batch_size": 32,
"recommended_lr": 1e-3,
"lora_r": 16,
"lora_alpha": 32
},
"4B": {
"base_model": "Qwen/Qwen3-4B",
"embedding_model": "Qwen/Qwen3-Embedding-4B",
"embedding_dim": 2560,
"max_length": 32768,
"recommended_batch_size": 16,
"recommended_lr": 5e-4,
"lora_r": 32,
"lora_alpha": 64
},
"8B": {
"base_model": "Qwen/Qwen3-8B",
"embedding_model": "Qwen/Qwen3-Embedding-8B",
"embedding_dim": 4096,
"max_length": 32768,
"recommended_batch_size": 8,
"recommended_lr": 2e-4,
"lora_r": 64,
"lora_alpha": 128
}
}
# 模型文件路径配置
MODEL_PATHS = {
"embedding": {
"0.6B": "./models/qwen3_embedding_0.6b_sentiment.pth",
"4B": "./models/qwen3_embedding_4b_sentiment.pth",
"8B": "./models/qwen3_embedding_8b_sentiment.pth"
},
"lora": {
"0.6B": "./models/qwen3_lora_0.6b_final",
"4B": "./models/qwen3_lora_4b_final",
"8B": "./models/qwen3_lora_8b_final"
}
}