-
Notifications
You must be signed in to change notification settings - Fork 74
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
#8558: Refactor t3000, tg and tgg pipelines, workflows and run test s…
…cripts
- Loading branch information
Showing
26 changed files
with
862 additions
and
284 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,52 @@ | ||
name: "[T3K] T3000 demo tests" | ||
|
||
on: | ||
workflow_dispatch: | ||
schedule: | ||
- cron: '0 0 * * 6' # This cron schedule runs the workflow every Saturday at 12am UTC | ||
|
||
jobs: | ||
build-artifact: | ||
uses: ./.github/workflows/build-artifact.yaml | ||
with: | ||
arch: '["wormhole_b0"]' | ||
secrets: inherit | ||
t3000-demo-tests: | ||
needs: build-artifact | ||
strategy: | ||
fail-fast: false | ||
matrix: | ||
test-group: [ | ||
{ | ||
name: "T3000 demo tests", | ||
arch: wormhole_b0, | ||
runs-on: [arch-wormhole_b0, "config-t3000", "in-service", "runner-test", "bare-metal", "pipeline-functional"], | ||
cmd: './tests/scripts/run_tests.sh --tt-arch wormhole_b0 --pipeline-type demos_t3000_device --dispatch-mode ""' | ||
}, | ||
] | ||
name: ${{ matrix.test-group.name }} | ||
env: | ||
TT_METAL_ENV: ${{ vars.TT_METAL_ENV }} | ||
ARCH_NAME: ${{ matrix.test-group.arch }} | ||
LOGURU_LEVEL: INFO | ||
LD_LIBRARY_PATH: ${{ github.workspace }}/build/lib | ||
environment: dev | ||
runs-on: ${{ matrix.test-group.runs-on }} | ||
steps: | ||
- uses: tenstorrent-metal/metal-workflows/.github/actions/[email protected] | ||
- name: Set up dynamic env vars for build | ||
run: | | ||
echo "TT_METAL_HOME=$(pwd)" >> $GITHUB_ENV | ||
- uses: actions/download-artifact@v4 | ||
with: | ||
name: TTMetal_build_${{ matrix.test-group.arch }} | ||
- name: Extract files | ||
run: tar -xvf ttm_${{ matrix.test-group.arch }}.tar | ||
- uses: ./.github/actions/install-python-deps | ||
- name: Run demo regression tests | ||
timeout-minutes: 180 | ||
run: | | ||
source ${{ github.workspace }}/python_env/bin/activate | ||
cd $TT_METAL_HOME | ||
export PYTHONPATH=$TT_METAL_HOME | ||
${{ matrix.test-group.cmd }} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,52 @@ | ||
name: "[T3K] T3000 frequent tests" | ||
|
||
on: | ||
workflow_dispatch: | ||
schedule: | ||
- cron: "0 */8 * * *" # This cron schedule runs the workflow every 8 hours | ||
|
||
jobs: | ||
build-artifact: | ||
uses: ./.github/workflows/build-artifact.yaml | ||
with: | ||
arch: '["wormhole_b0"]' | ||
secrets: inherit | ||
t3000-frequent-tests: | ||
needs: build-artifact | ||
strategy: | ||
fail-fast: false | ||
matrix: | ||
test-group: [ | ||
{ | ||
name: "T3000 frequent tests", | ||
arch: wormhole_b0, | ||
runs-on: [arch-wormhole_b0, "config-t3000", "in-service", "runner-test", "bare-metal", "pipeline-functional"], | ||
cmd: './tests/scripts/run_tests.sh --tt-arch wormhole_b0 --pipeline-type frequent_t3000_device --dispatch-mode ""' | ||
}, | ||
] | ||
name: ${{ matrix.test-group.name }} | ||
env: | ||
TT_METAL_ENV: ${{ vars.TT_METAL_ENV }} | ||
ARCH_NAME: ${{ matrix.test-group.arch }} | ||
LOGURU_LEVEL: INFO | ||
LD_LIBRARY_PATH: ${{ github.workspace }}/build/lib | ||
environment: dev | ||
runs-on: ${{ matrix.test-group.runs-on }} | ||
steps: | ||
- uses: tenstorrent-metal/metal-workflows/.github/actions/[email protected] | ||
- name: Set up dynamic env vars for build | ||
run: | | ||
echo "TT_METAL_HOME=$(pwd)" >> $GITHUB_ENV | ||
- uses: actions/download-artifact@v4 | ||
with: | ||
name: TTMetal_build_${{ matrix.test-group.arch }} | ||
- name: Extract files | ||
run: tar -xvf ttm_${{ matrix.test-group.arch }}.tar | ||
- uses: ./.github/actions/install-python-deps | ||
- name: Run frequent regression tests | ||
timeout-minutes: 60 | ||
run: | | ||
source ${{ github.workspace }}/python_env/bin/activate | ||
cd $TT_METAL_HOME | ||
export PYTHONPATH=$TT_METAL_HOME | ||
${{ matrix.test-group.cmd }} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,87 @@ | ||
name: "[T3K] T3000 model perf tests" | ||
|
||
on: | ||
workflow_dispatch: | ||
schedule: | ||
- cron: "0 */12 * * *" # This cron schedule runs the workflow every 12 hours | ||
|
||
jobs: | ||
build-artifact: | ||
uses: ./.github/workflows/build-artifact.yaml | ||
with: | ||
arch: '["wormhole_b0"]' | ||
secrets: inherit | ||
t3000-model-perf-tests: | ||
needs: build-artifact | ||
strategy: | ||
fail-fast: false | ||
matrix: | ||
test-group: [ | ||
{ | ||
name: "T3000 LLM model perf tests", | ||
model-type: "LLM", | ||
arch: wormhole_b0, | ||
runs-on: [arch-wormhole_b0, "config-t3000", "in-service", "runner-test", "bare-metal", "pipeline-perf"], | ||
cmd: './tests/scripts/run_tests.sh --tt-arch wormhole_b0 --pipeline-type llm_model_perf_t3000_device --dispatch-mode ""' | ||
}, | ||
{ | ||
name: "T3000 CNN model perf tests", | ||
model-type: "CNN", | ||
arch: wormhole_b0, | ||
runs-on: [arch-wormhole_b0, "config-t3000", "in-service", "runner-test", "bare-metal", "pipeline-perf"], | ||
cmd: './tests/scripts/run_tests.sh --tt-arch wormhole_b0 --pipeline-type cnn_model_perf_t3000_device --dispatch-mode ""' | ||
}, | ||
] | ||
name: ${{ matrix.test-group.name }} | ||
env: | ||
TT_METAL_ENV: ${{ vars.TT_METAL_ENV }} | ||
ARCH_NAME: ${{ matrix.test-group.arch }} | ||
LOGURU_LEVEL: INFO | ||
LD_LIBRARY_PATH: ${{ github.workspace }}/build/lib | ||
environment: dev | ||
runs-on: ${{ matrix.test-group.runs-on }} | ||
steps: | ||
- uses: tenstorrent-metal/metal-workflows/.github/actions/[email protected] | ||
- name: Enable performance mode | ||
run: | | ||
sudo cpupower frequency-set -g performance | ||
- name: Ensure weka mount is active | ||
run: | | ||
sudo systemctl restart mnt-MLPerf.mount | ||
sudo /etc/rc.local | ||
ls -al /mnt/MLPerf/bit_error_tests | ||
- name: Set up dynamic env vars for build | ||
run: | | ||
echo "TT_METAL_HOME=$(pwd)" >> $GITHUB_ENV | ||
echo "PYTHONPATH=$(pwd)" >> $GITHUB_ENV | ||
- uses: actions/download-artifact@v4 | ||
with: | ||
name: TTMetal_build_${{ matrix.test-group.arch }} | ||
- name: Extract files | ||
run: tar -xvf ttm_${{ matrix.test-group.arch }}.tar | ||
- uses: ./.github/actions/install-python-deps | ||
- name: Run model perf regression tests | ||
timeout-minutes: 60 | ||
run: | | ||
source ${{ github.workspace }}/python_env/bin/activate | ||
cd $TT_METAL_HOME | ||
export PYTHONPATH=$TT_METAL_HOME | ||
${{ matrix.test-group.cmd }} | ||
- name: Check perf report exists | ||
id: check-perf-report | ||
if: ${{ !cancelled() }} | ||
run: | | ||
ls -hal | ||
export PERF_REPORT_FILENAME=Models_Perf_$(date +%Y_%m_%d).csv | ||
ls -hal $PERF_REPORT_FILENAME | ||
echo "perf_report_filename=$PERF_REPORT_FILENAME" >> "$GITHUB_OUTPUT" | ||
- name: Upload perf report | ||
if: ${{ !cancelled() && steps.check-perf-report.conclusion == 'success' }} | ||
uses: actions/upload-artifact@v4 | ||
with: | ||
name: perf-report-csv-${{ matrix.model-type }}-${{ matrix.test-group.arch }}-${{ matrix.test-group.machine-type }} | ||
path: "${{ steps.check-perf-report.outputs.perf_report_filename }}" | ||
- name: Disable performance mode | ||
if: always() | ||
run: | | ||
sudo cpupower frequency-set -g ondemand |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,41 @@ | ||
name: "[T3K] T3000 profiler tests" | ||
|
||
on: | ||
workflow_dispatch: | ||
workflow_call: | ||
schedule: | ||
- cron: "0 */8 * * *" # This cron schedule runs the workflow every 8 hours | ||
|
||
jobs: | ||
t3000-profiler-tests: | ||
strategy: | ||
fail-fast: false | ||
matrix: | ||
test-group: [ | ||
{ | ||
name: "T3000 profiler tests", | ||
arch: wormhole_b0, | ||
runs-on: [arch-wormhole_b0, "config-t3000", "in-service", "runner-test", "bare-metal", "pipeline-perf"], | ||
cmd: './tests/scripts/run_profiler_regressions.sh' | ||
}, | ||
] | ||
name: ${{ matrix.test-group.name }} | ||
env: | ||
TT_METAL_ENV: ${{ vars.TT_METAL_ENV }} | ||
ARCH_NAME: ${{ matrix.test-group.arch }} | ||
LOGURU_LEVEL: INFO | ||
LD_LIBRARY_PATH: ${{ github.workspace }}/build/lib | ||
environment: dev | ||
runs-on: ${{ matrix.test-group.runs-on }} | ||
steps: | ||
- uses: tenstorrent-metal/metal-workflows/.github/actions/[email protected] | ||
- name: Set up dynamic env vars for build | ||
run: | | ||
echo "TT_METAL_HOME=$(pwd)" >> $GITHUB_ENV | ||
- name: Build tt-metal and libs | ||
run: | | ||
./scripts/build_scripts/build_with_profiler_opt.sh | ||
- name: Run profiler regression tests | ||
timeout-minutes: 30 | ||
run: | | ||
./tests/scripts/run_profiler_regressions.sh |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,52 @@ | ||
name: "[T3K] T3000 unit tests" | ||
|
||
on: | ||
workflow_dispatch: | ||
schedule: | ||
- cron: "0 */3 * * *" # This cron schedule runs the workflow every 3 hours | ||
|
||
jobs: | ||
build-artifact: | ||
uses: ./.github/workflows/build-artifact.yaml | ||
with: | ||
arch: '["wormhole_b0"]' | ||
secrets: inherit | ||
t3000-unit-tests: | ||
needs: build-artifact | ||
strategy: | ||
fail-fast: false | ||
matrix: | ||
test-group: [ | ||
{ | ||
name: "T3000 unit tests", | ||
arch: wormhole_b0, | ||
runs-on: [arch-wormhole_b0, "config-t3000", "in-service", "runner-test", "bare-metal", "pipeline-functional"], | ||
cmd: './tests/scripts/run_tests.sh --tt-arch wormhole_b0 --pipeline-type unit_t3000_device --dispatch-mode ""' | ||
}, | ||
] | ||
name: ${{ matrix.test-group.name }} | ||
env: | ||
TT_METAL_ENV: ${{ vars.TT_METAL_ENV }} | ||
ARCH_NAME: ${{ matrix.test-group.arch }} | ||
LOGURU_LEVEL: INFO | ||
LD_LIBRARY_PATH: ${{ github.workspace }}/build/lib | ||
environment: dev | ||
runs-on: ${{ matrix.test-group.runs-on }} | ||
steps: | ||
- uses: tenstorrent-metal/metal-workflows/.github/actions/[email protected] | ||
- name: Set up dynamic env vars for build | ||
run: | | ||
echo "TT_METAL_HOME=$(pwd)" >> $GITHUB_ENV | ||
- uses: actions/download-artifact@v4 | ||
with: | ||
name: TTMetal_build_${{ matrix.test-group.arch }} | ||
- name: Extract files | ||
run: tar -xvf ttm_${{ matrix.test-group.arch }}.tar | ||
- uses: ./.github/actions/install-python-deps | ||
- name: Run unit regression tests | ||
timeout-minutes: 120 | ||
run: | | ||
source ${{ github.workspace }}/python_env/bin/activate | ||
cd $TT_METAL_HOME | ||
export PYTHONPATH=$TT_METAL_HOME | ||
${{ matrix.test-group.cmd }} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,49 +1,49 @@ | ||
name: "[TG] TG unit tests" | ||
|
||
on: | ||
push: | ||
branches: | ||
- galaxy/main | ||
schedule: | ||
- cron: '0 0 * * *' # Runs every day at 12am UTC | ||
workflow_dispatch: | ||
|
||
jobs: | ||
build-artifact: | ||
uses: ./.github/workflows/build-artifact.yaml | ||
with: | ||
arch: '["wormhole_b0"]' | ||
secrets: inherit | ||
TG-tests: | ||
needs: build-artifact | ||
strategy: | ||
# Do not fail-fast because we need to ensure all tests go to completion | ||
# so we try not to get hanging machines | ||
fail-fast: false | ||
matrix: | ||
runner-info: [ | ||
# TG | ||
{arch: wormhole_b0, runs-on: ["config-tg", "in-service"]}, | ||
] | ||
test-group: [ | ||
{name: "TG Unit Tests", cmd: './tests/scripts/run_tests.sh --tt-arch wormhole_b0 --pipeline-type post_commit_tg --dispatch-mode ""'}, | ||
{ | ||
name: "TG unit tests", | ||
arch: wormhole_b0, | ||
runs-on: [arch-wormhole_b0, "config-tg", "in-service", "runner-test", "bare-metal", "pipeline-functional"], | ||
cmd: './tests/scripts/run_tests.sh --tt-arch wormhole_b0 --pipeline-type unit_tg_device --dispatch-mode ""' | ||
}, | ||
] | ||
name: ${{ matrix.test-group.name }} ${{ matrix.runner-info.arch }} ${{ matrix.runner-info.name }} | ||
name: ${{ matrix.test-group.name }} | ||
env: | ||
TT_METAL_ENV: ${{ vars.TT_METAL_ENV }} | ||
ARCH_NAME: ${{ matrix.runner-info.arch }} | ||
ARCH_NAME: ${{ matrix.test-group.arch }} | ||
LOGURU_LEVEL: INFO | ||
LD_LIBRARY_PATH: ${{ github.workspace }}/build/lib | ||
runs-on: ${{ matrix.runner-info.runs-on }} | ||
environment: dev | ||
runs-on: ${{ matrix.test-group.runs-on }} | ||
steps: | ||
- uses: tenstorrent-metal/metal-workflows/.github/actions/[email protected] | ||
- name: Set up dynamic env vars for build | ||
run: | | ||
echo "TT_METAL_HOME=$(pwd)" >> $GITHUB_ENV | ||
- uses: actions/download-artifact@v4 | ||
with: | ||
name: TTMetal_build_${{ matrix.runner-info.arch }} | ||
name: TTMetal_build_${{ matrix.test-group.arch }} | ||
- name: Extract files | ||
run: tar -xvf ttm_${{ matrix.runner-info.arch }}.tar | ||
run: tar -xvf ttm_${{ matrix.test-group.arch }}.tar | ||
- uses: ./.github/actions/install-python-deps | ||
- name: ${{ matrix.test-group.name }} tests | ||
- name: Run unit regression tests | ||
timeout-minutes: 45 | ||
run: | | ||
source ${{ github.workspace }}/python_env/bin/activate | ||
|
Oops, something went wrong.