mirror of
https://github.com/huggingface/transformers.git
synced 2025-07-03 04:40:06 +06:00
restructure AMD scheduled CI (#27743)
* fix --------- Co-authored-by: ydshieh <ydshieh@users.noreply.github.com>
This commit is contained in:
parent
e739a361bc
commit
e0d2e69582
25
.github/workflows/self-scheduled-amd-caller.yml
vendored
25
.github/workflows/self-scheduled-amd-caller.yml
vendored
@ -3,23 +3,12 @@ name: Self-hosted runner (AMD scheduled CI caller)
|
||||
on:
|
||||
schedule:
|
||||
- cron: "17 2 * * *"
|
||||
push:
|
||||
branches:
|
||||
- run_amd_scheduled_ci_caller*
|
||||
|
||||
jobs:
|
||||
run_amd_ci_mi210:
|
||||
name: AMD mi210
|
||||
if: (cancelled() != true) && ((github.event_name == 'schedule') || ((github.event_name == 'push') && startsWith(github.ref_name, 'run_amd_scheduled_ci_caller')))
|
||||
uses: ./.github/workflows/self-scheduled-amd.yml
|
||||
with:
|
||||
gpu_flavor: mi210
|
||||
secrets: inherit
|
||||
|
||||
run_amd_ci_mi250:
|
||||
name: AMD mi250
|
||||
if: (cancelled() != true) && ((github.event_name == 'schedule') || ((github.event_name == 'push') && startsWith(github.ref_name, 'run_amd_scheduled_ci_caller')))
|
||||
uses: ./.github/workflows/self-scheduled-amd.yml
|
||||
with:
|
||||
gpu_flavor: mi250
|
||||
secrets: inherit
|
||||
run_scheduled_amd_ci:
|
||||
name: Trigger Scheduled AMD CI
|
||||
runs-on: ubuntu-22.04
|
||||
if: ${{ always() }}
|
||||
steps:
|
||||
- name: Trigger scheduled AMD CI via workflow_run
|
||||
run: echo "Trigger scheduled AMD CI via workflow_run"
|
||||
|
19
.github/workflows/self-scheduled-amd-mi210-caller.yml
vendored
Normal file
19
.github/workflows/self-scheduled-amd-mi210-caller.yml
vendored
Normal file
@ -0,0 +1,19 @@
|
||||
name: Self-hosted runner (AMD mi210 scheduled CI caller)

on:
  # Started when the "AMD scheduled CI caller" workflow completes on `main`,
  # or by a push to a `run_amd_scheduled_ci_caller*` branch for manual testing.
  workflow_run:
    workflows: ["Self-hosted runner (AMD scheduled CI caller)"]
    branches: ["main"]
    types: [completed]
  push:
    branches:
      - run_amd_scheduled_ci_caller*

jobs:
  run_amd_ci:
    name: AMD mi210
    # This workflow has no `schedule` trigger of its own: scheduled runs reach it
    # through `workflow_run`, so `github.event_name` is `workflow_run` (never
    # `schedule`). Checking for `schedule` here would skip the job on every
    # scheduled run.
    if: (cancelled() != true) && ((github.event_name == 'workflow_run') || ((github.event_name == 'push') && startsWith(github.ref_name, 'run_amd_scheduled_ci_caller')))
    uses: ./.github/workflows/self-scheduled-amd.yml
    with:
      gpu_flavor: mi210
    secrets: inherit
|
19
.github/workflows/self-scheduled-amd-mi250-caller.yml
vendored
Normal file
19
.github/workflows/self-scheduled-amd-mi250-caller.yml
vendored
Normal file
@ -0,0 +1,19 @@
|
||||
name: Self-hosted runner (AMD mi250 scheduled CI caller)

on:
  # Started when the "AMD scheduled CI caller" workflow completes on `main`,
  # or by a push to a `run_amd_scheduled_ci_caller*` branch for manual testing.
  workflow_run:
    workflows: ["Self-hosted runner (AMD scheduled CI caller)"]
    branches: ["main"]
    types: [completed]
  push:
    branches:
      - run_amd_scheduled_ci_caller*

jobs:
  run_amd_ci:
    name: AMD mi250
    # This workflow has no `schedule` trigger of its own: scheduled runs reach it
    # through `workflow_run`, so `github.event_name` is `workflow_run` (never
    # `schedule`). Checking for `schedule` here would skip the job on every
    # scheduled run.
    if: (cancelled() != true) && ((github.event_name == 'workflow_run') || ((github.event_name == 'push') && startsWith(github.ref_name, 'run_amd_scheduled_ci_caller')))
    uses: ./.github/workflows/self-scheduled-amd.yml
    with:
      gpu_flavor: mi250
    secrets: inherit
|
2
.github/workflows/self-scheduled-amd.yml
vendored
2
.github/workflows/self-scheduled-amd.yml
vendored
@ -438,7 +438,7 @@ jobs:
|
||||
CI_SLACK_CHANNEL_DUMMY_TESTS: ${{ secrets.CI_SLACK_CHANNEL_DUMMY_TESTS }}
|
||||
CI_SLACK_REPORT_CHANNEL_ID: ${{ secrets.CI_SLACK_CHANNEL_ID_DAILY_AMD }}
|
||||
ACCESS_REPO_INFO_TOKEN: ${{ secrets.ACCESS_REPO_INFO_TOKEN }}
|
||||
CI_EVENT: Scheduled CI (AMD)
|
||||
CI_EVENT: Scheduled CI (AMD) - ${{ inputs.gpu_flavor }}
|
||||
CI_SHA: ${{ github.sha }}
|
||||
CI_WORKFLOW_REF: ${{ github.workflow_ref }}
|
||||
RUNNER_STATUS: ${{ needs.check_runner_status.result }}
|
||||
|
@ -119,10 +119,17 @@ class Message:
|
||||
# Failures and success of the additional tests
|
||||
self.n_additional_success = sum(r["success"] for r in additional_results.values())
|
||||
|
||||
all_additional_failures = dicts_to_sum([r["failed"] for r in additional_results.values()])
|
||||
self.n_additional_single_gpu_failures = all_additional_failures["single"]
|
||||
self.n_additional_multi_gpu_failures = all_additional_failures["multi"]
|
||||
self.n_additional_unknown_gpu_failures = all_additional_failures["unclassified"]
|
||||
if len(additional_results) > 0:
|
||||
# `dicts_to_sum` requires a non-empty input, so only call it when there are additional results; otherwise the failure counts default to 0 below.
|
||||
all_additional_failures = dicts_to_sum([r["failed"] for r in additional_results.values()])
|
||||
self.n_additional_single_gpu_failures = all_additional_failures["single"]
|
||||
self.n_additional_multi_gpu_failures = all_additional_failures["multi"]
|
||||
self.n_additional_unknown_gpu_failures = all_additional_failures["unclassified"]
|
||||
else:
|
||||
self.n_additional_single_gpu_failures = 0
|
||||
self.n_additional_multi_gpu_failures = 0
|
||||
self.n_additional_unknown_gpu_failures = 0
|
||||
|
||||
self.n_additional_failures = (
|
||||
self.n_additional_single_gpu_failures
|
||||
+ self.n_additional_multi_gpu_failures
|
||||
@ -903,6 +910,9 @@ if __name__ == "__main__":
|
||||
elif ci_event.startswith("Push CI (AMD) - "):
|
||||
flavor = ci_event.replace("Push CI (AMD) - ", "")
|
||||
job_name_prefix = f"AMD {flavor}"
|
||||
elif ci_event.startswith("Scheduled CI (AMD) - "):
|
||||
flavor = ci_event.replace("Scheduled CI (AMD) - ", "")
|
||||
job_name_prefix = f"AMD {flavor}"
|
||||
|
||||
for model in model_results.keys():
|
||||
for artifact_path in available_artifacts[f"run_all_tests_gpu_{model}_test_reports"].paths:
|
||||
|
Loading…
Reference in New Issue
Block a user