Skip to content
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
5 changes: 3 additions & 2 deletions .github/workflows/_e2e_nightly_multi_node.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -101,15 +101,16 @@ jobs:
- name: Decode kubeconfig from secrets
run: |
# Decode and save kubeconfig
echo "${{ secrets.KUBECONFIG_B64 }}" | base64 -d > $KUBECONFIG
# echo "${{ secrets.KUBECONFIG_B64 }}" | base64 -d > $KUBECONFIG
cp /root/.cache/.kube/kubeconfig.yaml $KUBECONFIG

- name: Checkout code
uses: actions/checkout@v6

- name: Prepare scripts
run: |
# prepare for lws entrypoint scripts
install -D tests/e2e/nightly/multi_node/scripts/run.sh /root/.cache/tests/run.sh
# install -D tests/e2e/nightly/multi_node/scripts/run.sh /root/.cache/tests/run.sh
# clear log directory
rm -fr $RESULT_FILE

Expand Down
78 changes: 39 additions & 39 deletions .github/workflows/nightly_test_a3.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -27,8 +27,8 @@ on:
workflow_dispatch:
pull_request:
branches:
- 'main'
types: [ labeled ]
- 'releases/*'
# types: [ labeled ]

# Bash shells do not use ~/.profile or ~/.bashrc so these shells need to be explicitly
# declared as "shell: bash -el {0}" on steps that need to be properly activated.
Expand All @@ -44,51 +44,51 @@ concurrency:
jobs:
multi-node-tests:
name: multi-node
if: always() && (github.event_name == 'schedule' || github.event_name == 'workflow_dispatch')
# if: always() && (github.event_name == 'schedule' || github.event_name == 'workflow_dispatch')
strategy:
fail-fast: false
max-parallel: 1
matrix:
test_config:
- name: multi-node-deepseek-pd
config_file_path: DeepSeek-V3.yaml
size: 2
- name: multi-node-qwen3-dp
config_file_path: Qwen3-235B-A22B.yaml
size: 2
# - name: multi-node-dpsk-4node-pd
# config_file_path: DeepSeek-R1-W8A8.yaml
# size: 4
- name: multi-node-qwenw8a8-2node
config_file_path: Qwen3-235B-W8A8.yaml
size: 2
# - name: multi-node-deepseek-r1-w8a8-eplb
# config_file_path: DeepSeek-R1-W8A8-EPLB.yaml
# size: 4
- name: multi-node-qwenw8a8-2node-eplb
config_file_path: Qwen3-235B-W8A8-EPLB.yaml
size: 2
# - name: multi-node-deepseek-pd
# config_file_path: DeepSeek-V3.yaml
# size: 2
# - name: multi-node-qwen3-dp
# config_file_path: Qwen3-235B-A22B.yaml
# size: 2
# # - name: multi-node-dpsk-4node-pd
# # config_file_path: DeepSeek-R1-W8A8.yaml
# # size: 4
# - name: multi-node-qwenw8a8-2node
# config_file_path: Qwen3-235B-W8A8.yaml
# size: 2
# # - name: multi-node-deepseek-r1-w8a8-eplb
# # config_file_path: DeepSeek-R1-W8A8-EPLB.yaml
# # size: 4
# - name: multi-node-qwenw8a8-2node-eplb
# config_file_path: Qwen3-235B-W8A8-EPLB.yaml
# size: 2
- name: multi-node-dpsk3.2-2node
config_file_path: DeepSeek-V3_2-W8A8-A3-dual-nodes.yaml
size: 2
- name: multi-node-deepseek-r1-w8a8-longseq
config_file_path: DeepSeek-R1-W8A8-longseq.yaml
size: 2
- name: multi-node-qwenw8a8-2node-longseq
config_file_path: Qwen3-235B-W8A8-longseq.yaml
size: 2
- name: multi-node-qwen-disagg-pd
config_file_path: Qwen3-235B-disagg-pd.yaml
size: 2
- name: multi-node-qwen-vl-disagg-pd
config_file_path: Qwen3-VL-235B-disagg-pd.yaml
size: 2
- name: multi-node-kimi-k2-instruct-w8a8
config_file_path: Kimi-K2-Instruct-W8A8.yaml
size: 2
- name: multi-node-deepseek-v3.1
config_file_path: DeepSeek-V3.1-BF16.yaml
size: 2
# - name: multi-node-deepseek-r1-w8a8-longseq
# config_file_path: DeepSeek-R1-W8A8-longseq.yaml
# size: 2
# - name: multi-node-qwenw8a8-2node-longseq
# config_file_path: Qwen3-235B-W8A8-longseq.yaml
# size: 2
# - name: multi-node-qwen-disagg-pd
# config_file_path: Qwen3-235B-disagg-pd.yaml
# size: 2
# - name: multi-node-qwen-vl-disagg-pd
# config_file_path: Qwen3-VL-235B-disagg-pd.yaml
# size: 2
# - name: multi-node-kimi-k2-instruct-w8a8
# config_file_path: Kimi-K2-Instruct-W8A8.yaml
# size: 2
# - name: multi-node-deepseek-v3.1
# config_file_path: DeepSeek-V3.1-BF16.yaml
# size: 2
uses: ./.github/workflows/_e2e_nightly_multi_node.yaml
with:
soc_version: a3
Expand Down
Loading