update code

This commit is contained in:
ZeYi Lin
2025-07-03 18:21:26 +08:00
parent db3a162cd8
commit 08a0fa8c3e
4 changed files with 8 additions and 8 deletions

View File

@@ -33,7 +33,7 @@ from transformers import (
import datetime
from transformers.testing_utils import CaptureLogger
from transformers.trainer_utils import get_last_checkpoint
-import wandb
+import swanlab
from tqdm import tqdm
@@ -183,8 +183,8 @@ def main():
parser = HfArgumentParser((ModelArguments, DataTrainingArguments, TrainingArguments))
model_args, data_args, training_args = parser.parse_args_into_dataclasses()
-# 初始化 WandB
-wandb.init(project="sft", name="qwen-1.5b")
+# 初始化 SwanLab
+swanlab.init(project="sft", name="qwen-1.5b")
# 设置日志
logging.basicConfig(

View File

@@ -22,6 +22,6 @@ deepspeed finetune.py \
--bf16 \
--gradient_checkpointing \
--deepspeed ./ds_config_zero2.json \
---report_to wandb
+--report_to swanlab
# --resume_from_checkpoint ${output_model}/checkpoint-20400 \

View File

@@ -30,7 +30,7 @@ from transformers import (
import datetime
from transformers.testing_utils import CaptureLogger
from transformers.trainer_utils import get_last_checkpoint
-import wandb
+import swanlab
logger = logging.getLogger(__name__)
@@ -95,8 +95,8 @@ def main():
parser = HfArgumentParser((ModelArguments, DataTrainingArguments, TrainingArguments))
model_args, data_args, training_args = parser.parse_args_into_dataclasses()
-# 初始化 WandB
-wandb.init(project="pretrain", name="from_scrach")
+# 初始化 SwanLab
+swanlab.init(project="pretrain", name="from_scrach")
# 设置日志
logging.basicConfig(

View File

@@ -24,6 +24,6 @@ deepspeed pretrain.py \
--bf16 \
--gradient_checkpointing \
--deepspeed ./ds_config_zero2.json \
---report_to wandb
+--report_to swanlab
# --resume_from_checkpoint ${output_model}/checkpoint-20400 \