完善了跳连接,在上decode块后增加特征精炼层,未测效果

This commit is contained in:
2026-01-09 18:23:45 +08:00
parent 500c2eb18f
commit 12de74f130
8 changed files with 893 additions and 244 deletions

View File

@@ -11,9 +11,10 @@ shift 2
# Default parameters
# Every setting below can be overridden from the environment; the fallback
# after ":-" is used only when the variable is unset or empty.
MODEL=${MODEL:-"SwiftFormerTemporal_XS"}
# Exactly one default assignment per variable: a second ${VAR:-...} line would
# be a no-op because the first one has already given the variable a value.
BATCH_SIZE=${BATCH_SIZE:-128}
EPOCHS=${EPOCHS:-100}
# Previous learning-rate default, kept for reference:
# LR=${LR:-1e-3}
LR=${LR:-0.01}
OUTPUT_DIR=${OUTPUT_DIR:-"./temporal_output"}
echo "Starting distributed training with $NUM_GPUS GPUs"