"git@developer.sourcefind.cn:chenpangpang/transformers.git" did not exist on "61400e1ec7898892e77314dd819c1a1a52bd5268"
Unverified Commit d903abfc authored by Yih-Dar, committed by GitHub
Browse files

Fix AMD CI not showing GPU (#27555)



fix
Co-authored-by: ydshieh <ydshieh@users.noreply.github.com>
parent fe3ce061
...@@ -38,14 +38,16 @@ jobs: ...@@ -38,14 +38,16 @@ jobs:
runs-on: [self-hosted, docker-gpu, amd-gpu, '${{ matrix.machine_type }}', '${{ inputs.gpu_flavor }}'] runs-on: [self-hosted, docker-gpu, amd-gpu, '${{ matrix.machine_type }}', '${{ inputs.gpu_flavor }}']
container: container:
image: huggingface/transformers-pytorch-amd-gpu-push-ci # <--- We test only for PyTorch for now image: huggingface/transformers-pytorch-amd-gpu-push-ci # <--- We test only for PyTorch for now
options: --device /dev/kfd --device /dev/dri --env HIP_VISIBLE_DEVICES --env ROCR_VISIBLE_DEVICES --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/ options: --device /dev/kfd --device /dev/dri --env ROCR_VISIBLE_DEVICES --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/
steps: steps:
- name: ROCM-SMI - name: ROCM-SMI
run: |
rocm-smi
- name: ROCM-INFO
run: | run: |
rocminfo | grep "Agent" -A 14 rocminfo | grep "Agent" -A 14
- name: Show HIP environment - name: Show ROCR environment
run: | run: |
echo "HIP: $HIP_VISIBLE_DEVICES"
echo "ROCR: $ROCR_VISIBLE_DEVICES" echo "ROCR: $ROCR_VISIBLE_DEVICES"
setup_gpu: setup_gpu:
...@@ -57,7 +59,7 @@ jobs: ...@@ -57,7 +59,7 @@ jobs:
runs-on: [self-hosted, docker-gpu, amd-gpu, '${{ matrix.machine_type }}', '${{ inputs.gpu_flavor }}'] runs-on: [self-hosted, docker-gpu, amd-gpu, '${{ matrix.machine_type }}', '${{ inputs.gpu_flavor }}']
container: container:
image: huggingface/transformers-pytorch-amd-gpu-push-ci # <--- We test only for PyTorch for now image: huggingface/transformers-pytorch-amd-gpu-push-ci # <--- We test only for PyTorch for now
options: --device /dev/kfd --device /dev/dri --env HIP_VISIBLE_DEVICES --env ROCR_VISIBLE_DEVICES --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/ options: --device /dev/kfd --device /dev/dri --env ROCR_VISIBLE_DEVICES --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/
outputs: outputs:
matrix: ${{ steps.set-matrix.outputs.matrix }} matrix: ${{ steps.set-matrix.outputs.matrix }}
test_map: ${{ steps.set-matrix.outputs.test_map }} test_map: ${{ steps.set-matrix.outputs.test_map }}
...@@ -155,7 +157,7 @@ jobs: ...@@ -155,7 +157,7 @@ jobs:
runs-on: [self-hosted, docker-gpu, amd-gpu, '${{ matrix.machine_type }}', '${{ inputs.gpu_flavor }}'] runs-on: [self-hosted, docker-gpu, amd-gpu, '${{ matrix.machine_type }}', '${{ inputs.gpu_flavor }}']
container: container:
image: huggingface/transformers-pytorch-amd-gpu-push-ci # <--- We test only for PyTorch for now image: huggingface/transformers-pytorch-amd-gpu-push-ci # <--- We test only for PyTorch for now
options: --device /dev/kfd --device /dev/dri --env HIP_VISIBLE_DEVICES --env ROCR_VISIBLE_DEVICES --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/ options: --device /dev/kfd --device /dev/dri --env ROCR_VISIBLE_DEVICES --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/
steps: steps:
# Necessary to get the correct branch name and commit SHA for `workflow_run` event # Necessary to get the correct branch name and commit SHA for `workflow_run` event
# We also take into account the `push` event (we might want to test some changes in a branch) # We also take into account the `push` event (we might want to test some changes in a branch)
...@@ -206,11 +208,13 @@ jobs: ...@@ -206,11 +208,13 @@ jobs:
echo "matrix_folders=$matrix_folders" >> $GITHUB_ENV echo "matrix_folders=$matrix_folders" >> $GITHUB_ENV
- name: ROCM-SMI - name: ROCM-SMI
run: |
rocm-smi
- name: ROCM-INFO
run: | run: |
rocminfo | grep "Agent" -A 14 rocminfo | grep "Agent" -A 14
- name: Show HIP environment - name: Show ROCR environment
run: | run: |
echo "HIP: $HIP_VISIBLE_DEVICES"
echo "ROCR: $ROCR_VISIBLE_DEVICES" echo "ROCR: $ROCR_VISIBLE_DEVICES"
- name: Environment - name: Environment
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment