Skip to content
Open
1 change: 1 addition & 0 deletions examples/run_qwen3.5_4b_dflash_online_npu.sh
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,7 @@ export SPECFORGE_DATA_NUM_PROC=64
ATTENTION_BACKEND=${2:-flex_attention}
NUM_GPUS=${1:-8}

# If OOM occurs on low-memory NPU devices, retry with a smaller --num-anchors value.
torchrun \
--standalone \
--nproc_per_node $NUM_GPUS \
Expand Down
3 changes: 2 additions & 1 deletion examples/run_qwen3.5_4b_domino_online_npu.sh
Original file line number Diff line number Diff line change
Expand Up @@ -20,6 +20,7 @@ NUM_DEVICES=$(echo "$NPU_DEVICES" | tr ',' '\n' | wc -l)
export ASCEND_RT_VISIBLE_DEVICES=$NPU_DEVICES
export PYTORCH_NPU_ALLOC_CONF=max_split_size_mb:32

# If OOM occurs on low-memory NPU devices, retry with a smaller --num-anchors value.
torchrun \
--standalone \
--nproc_per_node "$NUM_DEVICES" \
Expand All @@ -37,7 +38,7 @@ torchrun \
--max-length 1024 \
--chat-template qwen3.5 \
--attention-backend sdpa \
--num-anchors 16 \
--num-anchors 256 \
--loss-decay-gamma 7.0 \
--log-interval 50 \
--save-interval 3000 \
Expand Down
Loading