kind: Container
metadata:
name: ms-swift-test
namespace: test
labels:
this: that
image: "us-docker.pkg.dev/agentsea-dev/orign/swift-trainer:latest"
command: |
CUDA_VISIBLE_DEVICES=0 \
MAX_PIXELS=1003520 \
swift sft \
--model Qwen/Qwen2-VL-7B-Instruct \
--dataset 'modelscope/coco_2014_caption:train#300' \
--train_type lora \
--torch_dtype bfloat16 \
--num_train_epochs 1 \
--per_device_train_batch_size 1 \
--per_device_eval_batch_size 1 \
--learning_rate 1e-4 \
--lora_rank 8 \
--lora_alpha 32 \
--target_modules all-linear \
--freeze_vit true \
--gradient_accumulation_steps 16 \
--eval_steps 100 \
--save_steps 100 \
--save_total_limit 5 \
--logging_steps 5 \
--max_length 2048 \
--output_dir /nebu/swift-test \
--warmup_ratio 0.05 \
--dataloader_num_workers 4
platform: runpod
env:
- key: HELLO
value: world
volumes:
- source: /nebu/swift-test
dest: s3://nebulous-rs/swift-test
driver: RCLONE_SYNC
continuous: true
accelerators:
- "1:A100_SXM"
meters:
- cost: 0.1
unit: second
metric: runtime
currency: USD
restart: Never