From 3313d1b28cb9075031b23cdce3a0e80759f8e858 Mon Sep 17 00:00:00 2001 From: ydshieh Date: Tue, 3 Sep 2024 09:07:25 +0200 Subject: [PATCH] use daily ci without sleep 10 --- .github/workflows/model_jobs.yml | 148 +++++++++++++-------------- .github/workflows/self-scheduled.yml | 2 +- 2 files changed, 73 insertions(+), 77 deletions(-) diff --git a/.github/workflows/model_jobs.yml b/.github/workflows/model_jobs.yml index 55ebac46d9e040..ddac81a9e3afb8 100644 --- a/.github/workflows/model_jobs.yml +++ b/.github/workflows/model_jobs.yml @@ -191,7 +191,6 @@ jobs: working-directory: /transformers run: | ls -l /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/.no_exist/42ce72ae70f7d34c14dbc3a856379a5d5b72de47/config.json - sleep 10 rm -rf /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/.no_exist - name: Check cache 9 @@ -205,7 +204,6 @@ jobs: working-directory: /transformers run: | ls -l /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/.no_exist/42ce72ae70f7d34c14dbc3a856379a5d5b72de47/config.json - sleep 10 rm -rf /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/.no_exist/42ce72ae70f7d34c14dbc3a856379a5d5b72de47 - name: Check cache 9 @@ -218,7 +216,6 @@ jobs: working-directory: /transformers run: | ls -l /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/.no_exist/42ce72ae70f7d34c14dbc3a856379a5d5b72de47/config.json - sleep 10 rm -rf /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/.no_exist/42ce72ae70f7d34c14dbc3a856379a5d5b72de47/config.json - name: Check cache 9 @@ -259,79 +256,78 @@ jobs: - name: Check cache 9 working-directory: /transformers run: | - sleep 10 tail -10 /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/.no_exist/42ce72ae70f7d34c14dbc3a856379a5d5b72de47/config.json - - - name: Check cache 9.5 - working-directory: /transformers - run: | - apt-get install -y sudo - - - name: Check cache 9.5 2 - working-directory: /transformers - run: | - apt-get install sudo - - - name: Check cache 10 - working-directory: /transformers - run: | - sudo chown -R nobody:nogroup /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/ - - - name: Check cache 11 - working-directory: /transformers - run: | - ls -l /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/ - - - name: Check cache 12 - working-directory: /transformers - run: | - ls -l /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/.no_exist - - - name: Check cache 13 - working-directory: /transformers - run: | - ls -l /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/.no_exist/42ce72ae70f7d34c14dbc3a856379a5d5b72de47 - - - name: Check cache 14 - working-directory: /transformers - run: | - ls -l /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/.no_exist/42ce72ae70f7d34c14dbc3a856379a5d5b72de47/config.json - - - name: check who I am - working-directory: /transformers - run: | - whoami - -# - name: delete 1 cache +# +# - name: Check cache 9.5 # working-directory: /transformers # run: | -# rm -rf /mnt/cache/hub/models--hf-internal-testing--config-no-model - - - name: Run all tests on GPU - working-directory: /transformers - run: python3 -m pytest -rsfE -v --make-reports=${{ inputs.machine_type }}_run_models_gpu_${{ matrix.folders }}_test_reports tests/${{ matrix.folders }} - - - name: Failure short reports - if: ${{ failure() }} - continue-on-error: true - run: cat /transformers/reports/${{ inputs.machine_type }}_run_models_gpu_${{ matrix.folders }}_test_reports/failures_short.txt - - - name: Run test - shell: bash - run: | - mkdir -p /transformers/reports/${{ inputs.machine_type }}_run_models_gpu_${{ matrix.folders }}_test_reports - echo "hello" > /transformers/reports/${{ inputs.machine_type }}_run_models_gpu_${{ matrix.folders }}_test_reports/hello.txt - echo "${{ inputs.machine_type }}_run_models_gpu_${{ matrix.folders }}_test_reports" - - - name: Check cache 9 - working-directory: /transformers - run: | - ls -l /mnt/cache/hub/models--BAAI--AltCLIP/snapshots/b989a7bc9f73809acc4df8265e63174c74791ba6/pytorch_model.bin - - - name: "Test suite reports artifacts: ${{ inputs.machine_type }}_run_models_gpu_${{ env.matrix_folders }}_test_reports" - if: ${{ always() }} - uses: actions/upload-artifact@v4 - with: - name: ${{ inputs.machine_type }}_run_models_gpu_${{ env.matrix_folders }}_test_reports - path: /transformers/reports/${{ inputs.machine_type }}_run_models_gpu_${{ matrix.folders }}_test_reports - +# apt-get install -y sudo +# +# - name: Check cache 9.5 2 +# working-directory: /transformers +# run: | +# apt-get install sudo +# +# - name: Check cache 10 +# working-directory: /transformers +# run: | +# sudo chown -R nobody:nogroup /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/ +# +# - name: Check cache 11 +# working-directory: /transformers +# run: | +# ls -l /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/ +# +# - name: Check cache 12 +# working-directory: /transformers +# run: | +# ls -l /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/.no_exist +# +# - name: Check cache 13 +# working-directory: /transformers +# run: | +# ls -l /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/.no_exist/42ce72ae70f7d34c14dbc3a856379a5d5b72de47 +# +# - name: Check cache 14 +# working-directory: /transformers +# run: | +# ls -l /mnt/cache/hub/models--hf-internal-testing--no-config-test-repo/.no_exist/42ce72ae70f7d34c14dbc3a856379a5d5b72de47/config.json +# +# - name: check who I am +# working-directory: /transformers +# run: | +# whoami +# +## - name: delete 1 cache +## working-directory: /transformers +## run: | +## rm -rf /mnt/cache/hub/models--hf-internal-testing--config-no-model +# +# - name: Run all tests on GPU +# working-directory: /transformers +# run: python3 -m pytest -rsfE -v --make-reports=${{ inputs.machine_type }}_run_models_gpu_${{ matrix.folders }}_test_reports tests/${{ matrix.folders }} +# +# - name: Failure short reports +# if: ${{ failure() }} +# continue-on-error: true +# run: cat /transformers/reports/${{ inputs.machine_type }}_run_models_gpu_${{ matrix.folders }}_test_reports/failures_short.txt +# +# - name: Run test +# shell: bash +# run: | +# mkdir -p /transformers/reports/${{ inputs.machine_type }}_run_models_gpu_${{ matrix.folders }}_test_reports +# echo "hello" > /transformers/reports/${{ inputs.machine_type }}_run_models_gpu_${{ matrix.folders }}_test_reports/hello.txt +# echo "${{ inputs.machine_type }}_run_models_gpu_${{ matrix.folders }}_test_reports" +# +# - name: Check cache 9 +# working-directory: /transformers +# run: | +# ls -l /mnt/cache/hub/models--BAAI--AltCLIP/snapshots/b989a7bc9f73809acc4df8265e63174c74791ba6/pytorch_model.bin +# +# - name: "Test suite reports artifacts: ${{ inputs.machine_type }}_run_models_gpu_${{ env.matrix_folders }}_test_reports" +# if: ${{ always() }} +# uses: actions/upload-artifact@v4 +# with: +# name: ${{ inputs.machine_type }}_run_models_gpu_${{ env.matrix_folders }}_test_reports +# path: /transformers/reports/${{ inputs.machine_type }}_run_models_gpu_${{ matrix.folders }}_test_reports +# diff --git a/.github/workflows/self-scheduled.yml b/.github/workflows/self-scheduled.yml index 692356c03c4cae..d5a1a179472519 100644 --- a/.github/workflows/self-scheduled.yml +++ b/.github/workflows/self-scheduled.yml @@ -50,7 +50,7 @@ jobs: name: Setup strategy: matrix: - machine_type: [aws-g4dn-2xlarge-cache] + machine_type: [daily-ci] runs-on: group: '${{ matrix.machine_type }}' container: