4 lines
117 B
YAML
4 lines
117 B
YAML
|
model_dir: /home/colin/.cache/modelscope/hub/qwen/Qwen-1_8B-Chat
|
||
|
learning_rate: 0.0001
|
||
|
use_tril_attention_mask: null
|