All CI jobs with A10 (#39119)
all a10

Co-authored-by: ydshieh <ydshieh@users.noreply.github.com>
This commit is contained in:
2
.github/workflows/check_failed_tests.yml
vendored
2
.github/workflows/check_failed_tests.yml
vendored
@@ -41,7 +41,7 @@ jobs:
|
|||||||
check_new_failures:
|
check_new_failures:
|
||||||
name: " "
|
name: " "
|
||||||
runs-on:
|
runs-on:
|
||||||
group: aws-g4dn-4xlarge-cache
|
group: aws-g5-4xlarge-cache
|
||||||
container:
|
container:
|
||||||
image: ${{ inputs.docker }}
|
image: ${{ inputs.docker }}
|
||||||
options: --gpus all --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/
|
options: --gpus all --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/
|
||||||
|
|||||||
2
.github/workflows/doctest_job.yml
vendored
2
.github/workflows/doctest_job.yml
vendored
@@ -28,7 +28,7 @@ jobs:
|
|||||||
matrix:
|
matrix:
|
||||||
split_keys: ${{ fromJson(inputs.split_keys) }}
|
split_keys: ${{ fromJson(inputs.split_keys) }}
|
||||||
runs-on:
|
runs-on:
|
||||||
group: aws-g4dn-4xlarge-cache
|
group: aws-g5-4xlarge-cache
|
||||||
container:
|
container:
|
||||||
image: huggingface/transformers-all-latest-gpu
|
image: huggingface/transformers-all-latest-gpu
|
||||||
options: --gpus 0 --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/
|
options: --gpus 0 --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/
|
||||||
|
|||||||
2
.github/workflows/doctests.yml
vendored
2
.github/workflows/doctests.yml
vendored
@@ -15,7 +15,7 @@ jobs:
|
|||||||
setup:
|
setup:
|
||||||
name: Setup
|
name: Setup
|
||||||
runs-on:
|
runs-on:
|
||||||
group: aws-g4dn-4xlarge-cache
|
group: aws-g5-4xlarge-cache
|
||||||
container:
|
container:
|
||||||
image: huggingface/transformers-all-latest-gpu
|
image: huggingface/transformers-all-latest-gpu
|
||||||
options: --gpus 0 --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/
|
options: --gpus 0 --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/
|
||||||
|
|||||||
4
.github/workflows/model_jobs.yml
vendored
4
.github/workflows/model_jobs.yml
vendored
@@ -107,9 +107,9 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
echo "${{ inputs.machine_type }}"
|
echo "${{ inputs.machine_type }}"
|
||||||
|
|
||||||
if [ "${{ inputs.machine_type }}" = "aws-g4dn-4xlarge-cache" ]; then
|
if [ "${{ inputs.machine_type }}" = "aws-g5-4xlarge-cache" ]; then
|
||||||
machine_type=single-gpu
|
machine_type=single-gpu
|
||||||
elif [ "${{ inputs.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then
|
elif [ "${{ inputs.machine_type }}" = "aws-g5-12xlarge-cache" ]; then
|
||||||
machine_type=multi-gpu
|
machine_type=multi-gpu
|
||||||
else
|
else
|
||||||
machine_type=${{ inputs.machine_type }}
|
machine_type=${{ inputs.machine_type }}
|
||||||
|
|||||||
12
.github/workflows/self-comment-ci.yml
vendored
12
.github/workflows/self-comment-ci.yml
vendored
@@ -185,7 +185,7 @@ jobs:
|
|||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
folders: ${{ fromJson(needs.get-tests.outputs.models) }}
|
folders: ${{ fromJson(needs.get-tests.outputs.models) }}
|
||||||
machine_type: [aws-g4dn-4xlarge-cache, aws-g4dn-12xlarge-cache]
|
machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache]
|
||||||
runs-on:
|
runs-on:
|
||||||
group: '${{ matrix.machine_type }}'
|
group: '${{ matrix.machine_type }}'
|
||||||
container:
|
container:
|
||||||
@@ -239,9 +239,9 @@ jobs:
|
|||||||
shell: bash
|
shell: bash
|
||||||
run: |
|
run: |
|
||||||
echo "${{ matrix.machine_type }}"
|
echo "${{ matrix.machine_type }}"
|
||||||
if [ "${{ matrix.machine_type }}" = "aws-g4dn-4xlarge-cache" ]; then
|
if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then
|
||||||
machine_type=single-gpu
|
machine_type=single-gpu
|
||||||
elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then
|
elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then
|
||||||
machine_type=multi-gpu
|
machine_type=multi-gpu
|
||||||
else
|
else
|
||||||
machine_type=${{ matrix.machine_type }}
|
machine_type=${{ matrix.machine_type }}
|
||||||
@@ -292,7 +292,7 @@ jobs:
|
|||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
folders: ${{ fromJson(needs.get-tests.outputs.quantizations) }}
|
folders: ${{ fromJson(needs.get-tests.outputs.quantizations) }}
|
||||||
machine_type: [aws-g4dn-4xlarge-cache, aws-g4dn-12xlarge-cache]
|
machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache]
|
||||||
runs-on:
|
runs-on:
|
||||||
group: '${{ matrix.machine_type }}'
|
group: '${{ matrix.machine_type }}'
|
||||||
container:
|
container:
|
||||||
@@ -338,9 +338,9 @@ jobs:
|
|||||||
shell: bash
|
shell: bash
|
||||||
run: |
|
run: |
|
||||||
echo "${{ matrix.machine_type }}"
|
echo "${{ matrix.machine_type }}"
|
||||||
if [ "${{ matrix.machine_type }}" = "aws-g4dn-4xlarge-cache" ]; then
|
if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then
|
||||||
machine_type=single-gpu
|
machine_type=single-gpu
|
||||||
elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then
|
elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then
|
||||||
machine_type=multi-gpu
|
machine_type=multi-gpu
|
||||||
else
|
else
|
||||||
machine_type=${{ matrix.machine_type }}
|
machine_type=${{ matrix.machine_type }}
|
||||||
|
|||||||
26
.github/workflows/self-push.yml
vendored
26
.github/workflows/self-push.yml
vendored
@@ -31,7 +31,7 @@ jobs:
|
|||||||
name: Setup
|
name: Setup
|
||||||
strategy:
|
strategy:
|
||||||
matrix:
|
matrix:
|
||||||
machine_type: [aws-g4dn-2xlarge-cache, aws-g4dn-12xlarge-cache]
|
machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache]
|
||||||
runs-on:
|
runs-on:
|
||||||
group: '${{ matrix.machine_type }}'
|
group: '${{ matrix.machine_type }}'
|
||||||
container:
|
container:
|
||||||
@@ -131,7 +131,7 @@ jobs:
|
|||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
folders: ${{ fromJson(needs.setup.outputs.matrix) }}
|
folders: ${{ fromJson(needs.setup.outputs.matrix) }}
|
||||||
machine_type: [aws-g4dn-2xlarge-cache]
|
machine_type: [aws-g5-4xlarge-cache]
|
||||||
runs-on:
|
runs-on:
|
||||||
group: '${{ matrix.machine_type }}'
|
group: '${{ matrix.machine_type }}'
|
||||||
container:
|
container:
|
||||||
@@ -169,9 +169,9 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
echo "${{ matrix.machine_type }}"
|
echo "${{ matrix.machine_type }}"
|
||||||
|
|
||||||
if [ "${{ matrix.machine_type }}" = "aws-g4dn-2xlarge-cache" ]; then
|
if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then
|
||||||
machine_type=single-gpu
|
machine_type=single-gpu
|
||||||
elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then
|
elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then
|
||||||
machine_type=multi-gpu
|
machine_type=multi-gpu
|
||||||
else
|
else
|
||||||
machine_type=${{ matrix.machine_type }}
|
machine_type=${{ matrix.machine_type }}
|
||||||
@@ -244,7 +244,7 @@ jobs:
|
|||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
folders: ${{ fromJson(needs.setup.outputs.matrix) }}
|
folders: ${{ fromJson(needs.setup.outputs.matrix) }}
|
||||||
machine_type: [aws-g4dn-12xlarge-cache]
|
machine_type: [aws-g5-12xlarge-cache]
|
||||||
runs-on:
|
runs-on:
|
||||||
group: '${{ matrix.machine_type }}'
|
group: '${{ matrix.machine_type }}'
|
||||||
container:
|
container:
|
||||||
@@ -282,9 +282,9 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
echo "${{ matrix.machine_type }}"
|
echo "${{ matrix.machine_type }}"
|
||||||
|
|
||||||
if [ "${{ matrix.machine_type }}" = "aws-g4dn-2xlarge-cache" ]; then
|
if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then
|
||||||
machine_type=single-gpu
|
machine_type=single-gpu
|
||||||
elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then
|
elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then
|
||||||
machine_type=multi-gpu
|
machine_type=multi-gpu
|
||||||
else
|
else
|
||||||
machine_type=${{ matrix.machine_type }}
|
machine_type=${{ matrix.machine_type }}
|
||||||
@@ -357,7 +357,7 @@ jobs:
|
|||||||
strategy:
|
strategy:
|
||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
machine_type: [aws-g4dn-2xlarge-cache]
|
machine_type: [aws-g5-4xlarge-cache]
|
||||||
runs-on:
|
runs-on:
|
||||||
group: '${{ matrix.machine_type }}'
|
group: '${{ matrix.machine_type }}'
|
||||||
container:
|
container:
|
||||||
@@ -395,9 +395,9 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
echo "${{ matrix.machine_type }}"
|
echo "${{ matrix.machine_type }}"
|
||||||
|
|
||||||
if [ "${{ matrix.machine_type }}" = "aws-g4dn-2xlarge-cache" ]; then
|
if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then
|
||||||
machine_type=single-gpu
|
machine_type=single-gpu
|
||||||
elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then
|
elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then
|
||||||
machine_type=multi-gpu
|
machine_type=multi-gpu
|
||||||
else
|
else
|
||||||
machine_type=${{ matrix.machine_type }}
|
machine_type=${{ matrix.machine_type }}
|
||||||
@@ -467,7 +467,7 @@ jobs:
|
|||||||
strategy:
|
strategy:
|
||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
machine_type: [aws-g4dn-12xlarge-cache]
|
machine_type: [aws-g5-12xlarge-cache]
|
||||||
runs-on:
|
runs-on:
|
||||||
group: '${{ matrix.machine_type }}'
|
group: '${{ matrix.machine_type }}'
|
||||||
container:
|
container:
|
||||||
@@ -505,9 +505,9 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
echo "${{ matrix.machine_type }}"
|
echo "${{ matrix.machine_type }}"
|
||||||
|
|
||||||
if [ "${{ matrix.machine_type }}" = "aws-g4dn-2xlarge-cache" ]; then
|
if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then
|
||||||
machine_type=single-gpu
|
machine_type=single-gpu
|
||||||
elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then
|
elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then
|
||||||
machine_type=multi-gpu
|
machine_type=multi-gpu
|
||||||
else
|
else
|
||||||
machine_type=${{ matrix.machine_type }}
|
machine_type=${{ matrix.machine_type }}
|
||||||
|
|||||||
28
.github/workflows/self-scheduled.yml
vendored
28
.github/workflows/self-scheduled.yml
vendored
@@ -50,7 +50,7 @@ jobs:
|
|||||||
name: Setup
|
name: Setup
|
||||||
strategy:
|
strategy:
|
||||||
matrix:
|
matrix:
|
||||||
machine_type: [aws-g4dn-4xlarge-cache, aws-g4dn-12xlarge-cache]
|
machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache]
|
||||||
runs-on:
|
runs-on:
|
||||||
group: '${{ matrix.machine_type }}'
|
group: '${{ matrix.machine_type }}'
|
||||||
container:
|
container:
|
||||||
@@ -128,7 +128,7 @@ jobs:
|
|||||||
strategy:
|
strategy:
|
||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
machine_type: [aws-g4dn-4xlarge-cache, aws-g4dn-12xlarge-cache]
|
machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache]
|
||||||
slice_id: [0, 1]
|
slice_id: [0, 1]
|
||||||
uses: ./.github/workflows/model_jobs.yml
|
uses: ./.github/workflows/model_jobs.yml
|
||||||
with:
|
with:
|
||||||
@@ -145,7 +145,7 @@ jobs:
|
|||||||
strategy:
|
strategy:
|
||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
machine_type: [aws-g4dn-4xlarge-cache, aws-g4dn-12xlarge-cache]
|
machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache]
|
||||||
runs-on:
|
runs-on:
|
||||||
group: '${{ matrix.machine_type }}'
|
group: '${{ matrix.machine_type }}'
|
||||||
container:
|
container:
|
||||||
@@ -179,9 +179,9 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
echo "${{ matrix.machine_type }}"
|
echo "${{ matrix.machine_type }}"
|
||||||
|
|
||||||
if [ "${{ matrix.machine_type }}" = "aws-g4dn-4xlarge-cache" ]; then
|
if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then
|
||||||
machine_type=single-gpu
|
machine_type=single-gpu
|
||||||
elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then
|
elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then
|
||||||
machine_type=multi-gpu
|
machine_type=multi-gpu
|
||||||
else
|
else
|
||||||
machine_type=${{ matrix.machine_type }}
|
machine_type=${{ matrix.machine_type }}
|
||||||
@@ -213,7 +213,7 @@ jobs:
|
|||||||
strategy:
|
strategy:
|
||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
machine_type: [aws-g4dn-4xlarge-cache]
|
machine_type: [aws-g5-4xlarge-cache]
|
||||||
runs-on:
|
runs-on:
|
||||||
group: '${{ matrix.machine_type }}'
|
group: '${{ matrix.machine_type }}'
|
||||||
container:
|
container:
|
||||||
@@ -247,9 +247,9 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
echo "${{ matrix.machine_type }}"
|
echo "${{ matrix.machine_type }}"
|
||||||
|
|
||||||
if [ "${{ matrix.machine_type }}" = "aws-g4dn-4xlarge-cache" ]; then
|
if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then
|
||||||
machine_type=single-gpu
|
machine_type=single-gpu
|
||||||
elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then
|
elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then
|
||||||
machine_type=multi-gpu
|
machine_type=multi-gpu
|
||||||
else
|
else
|
||||||
machine_type=${{ matrix.machine_type }}
|
machine_type=${{ matrix.machine_type }}
|
||||||
@@ -282,7 +282,7 @@ jobs:
|
|||||||
strategy:
|
strategy:
|
||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
machine_type: [aws-g4dn-4xlarge-cache, aws-g4dn-12xlarge-cache]
|
machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache]
|
||||||
runs-on:
|
runs-on:
|
||||||
group: '${{ matrix.machine_type }}'
|
group: '${{ matrix.machine_type }}'
|
||||||
container:
|
container:
|
||||||
@@ -344,9 +344,9 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
echo "${{ matrix.machine_type }}"
|
echo "${{ matrix.machine_type }}"
|
||||||
|
|
||||||
if [ "${{ matrix.machine_type }}" = "aws-g4dn-4xlarge-cache" ]; then
|
if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then
|
||||||
machine_type=single-gpu
|
machine_type=single-gpu
|
||||||
elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then
|
elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then
|
||||||
machine_type=multi-gpu
|
machine_type=multi-gpu
|
||||||
else
|
else
|
||||||
machine_type=${{ matrix.machine_type }}
|
machine_type=${{ matrix.machine_type }}
|
||||||
@@ -381,7 +381,7 @@ jobs:
|
|||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
folders: ${{ fromJson(needs.setup.outputs.quantization_matrix) }}
|
folders: ${{ fromJson(needs.setup.outputs.quantization_matrix) }}
|
||||||
machine_type: [aws-g4dn-4xlarge-cache, aws-g4dn-12xlarge-cache]
|
machine_type: [aws-g5-4xlarge-cache, aws-g5-12xlarge-cache]
|
||||||
runs-on:
|
runs-on:
|
||||||
group: '${{ matrix.machine_type }}'
|
group: '${{ matrix.machine_type }}'
|
||||||
container:
|
container:
|
||||||
@@ -424,9 +424,9 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
echo "${{ matrix.machine_type }}"
|
echo "${{ matrix.machine_type }}"
|
||||||
|
|
||||||
if [ "${{ matrix.machine_type }}" = "aws-g4dn-4xlarge-cache" ]; then
|
if [ "${{ matrix.machine_type }}" = "aws-g5-4xlarge-cache" ]; then
|
||||||
machine_type=single-gpu
|
machine_type=single-gpu
|
||||||
elif [ "${{ matrix.machine_type }}" = "aws-g4dn-12xlarge-cache" ]; then
|
elif [ "${{ matrix.machine_type }}" = "aws-g5-12xlarge-cache" ]; then
|
||||||
machine_type=multi-gpu
|
machine_type=multi-gpu
|
||||||
else
|
else
|
||||||
machine_type=${{ matrix.machine_type }}
|
machine_type=${{ matrix.machine_type }}
|
||||||
|
|||||||
Reference in New Issue
Block a user