Skip to content

Commit 4676eb0

Browse files
authored
Merge branch 'master' into loadams/amd-57
2 parents e92426b + 3194fe8 commit 4676eb0

File tree

121 files changed

+2905
-781
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below for content that may be hidden.

121 files changed

+2905
-781
lines changed

.github/workflows/amd-mi200.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -25,7 +25,7 @@ jobs:
2525
# Steps represent a sequence of tasks that will be executed as part of the job
2626
steps:
2727
# Checks-out your repository under $GITHUB_WORKSPACE, so your job can access it
28-
- uses: actions/checkout@v3
28+
- uses: actions/checkout@v4
2929

3030
- id: setup-venv
3131
uses: ./.github/workflows/setup-venv

.github/workflows/cpu-torch-latest.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,7 @@ jobs:
2222
runs-on: ubuntu-20.04
2323

2424
steps:
25-
- uses: actions/checkout@v3
25+
- uses: actions/checkout@v4
2626

2727
- id: setup-venv
2828
uses: ./.github/workflows/setup-venv

.github/workflows/formatting.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -21,7 +21,7 @@ jobs:
2121
runs-on: ubuntu-20.04
2222

2323
steps:
24-
- uses: actions/checkout@v3
24+
- uses: actions/checkout@v4
2525

2626
- name: environment
2727
run: |

.github/workflows/hpu-gaudi2.yml

Lines changed: 19 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -8,7 +8,23 @@ on:
88
paths:
99
- ".github/workflows/hpu-gaudi2.yml"
1010
- "accelerator/hpu_accelerator.py"
11-
11+
- "op_builder/hpu/**"
12+
- "deepspeed/runtime/engine.py"
13+
- "deepspeed/runtime/bf16_optimizer.py"
14+
- "deepspeed/runtime/zero/stage_1_and_2.py"
15+
- "deepspeed/runtime/zero/stage3.py"
16+
- "deepspeed/runtime/zero/partition_parameters.py"
17+
- "deepspeed/runtime/zero/partitioned_param_coordinator.py"
18+
- "deepspeed/runtime/zero/parameter_offload.py"
19+
- "deepspeed/runtime/pipe/engine.py"
20+
- "deepspeed/runtime/utils.py"
21+
- "deepspeed/inference/engine.py"
22+
- "deepspeed/module_inject/auto_tp.py"
23+
- "deepspeed/module_inject/replace_module.py"
24+
- "deepspeed/module_inject/load_checkpoint.py"
25+
- "deepspeed/module_inject/inject.py"
26+
- "deepspeed/ops/transformer/**"
27+
- "deepspeed/ops/adam/**"
12 28

13 29
concurrency:
14 30
group: ${{ github.workflow }}-${{ github.ref }}
@@ -23,7 +39,7 @@ jobs:
23 39
# The type of runner that the job will run on
24 40
runs-on: [self-hosted, intel, gaudi2]
25 41
container:
26-
image: vault.habana.ai/gaudi-docker/1.14.0/ubuntu22.04/habanalabs/pytorch-installer-2.1.1:latest
42+
image: vault.habana.ai/gaudi-docker/1.15.0/ubuntu22.04/habanalabs/pytorch-installer-2.2.0:latest
27 43
ports:
28 44
- 80
29 45
options: --runtime=habana -e HABANA_VISIBLE_DEVICES=all -e OMPI_MCA_btl_vader_single_copy_mechanism=none --cap-add=sys_nice
@@ -83,7 +99,7 @@ jobs:
83 99
# Steps represent a sequence of tasks that will be executed as part of the job
84 100
steps:
85 101
# Checks-out your repository under $GITHUB_WORKSPACE, so your job can access it
86-
- uses: actions/checkout@v3
102+
- uses: actions/checkout@v4
87 103

88 104
- name: Check container state
89 105
run: |

.github/workflows/nv-a6000.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -29,7 +29,7 @@ jobs:
2929
options: --gpus all --shm-size "8G"
3030

3131
steps:
32-
- uses: actions/checkout@v3
32+
- uses: actions/checkout@v4
3333

3434
- name: Check container state
3535
run: |

.github/workflows/nv-accelerate-v100.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -19,10 +19,10 @@ concurrency:
1919

2020
jobs:
2121
unit-tests:
22-
runs-on: [self-hosted, nvidia, cu116, v100]
22+
runs-on: [self-hosted, nvidia, cu117, v100]
2323

2424
steps:
25-
- uses: actions/checkout@v3
25+
- uses: actions/checkout@v4
2626

2727
- id: setup-venv
2828
uses: ./.github/workflows/setup-venv

.github/workflows/nv-ds-chat.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -21,10 +21,10 @@ permissions:
2121

2222
jobs:
2323
unit-tests:
24-
runs-on: [self-hosted, nvidia, cu116, v100]
24+
runs-on: [self-hosted, nvidia, cu117, v100]
2525

2626
steps:
27-
- uses: actions/checkout@v3
27+
- uses: actions/checkout@v4
2828

2929
- id: setup-venv
3030
uses: ./.github/workflows/setup-venv

.github/workflows/nv-h100.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -23,7 +23,7 @@ jobs:
2323
options: --gpus all --shm-size "8G"
2424

2525
steps:
26-
- uses: actions/checkout@v3
26+
- uses: actions/checkout@v4
2727

2828
- name: Check container state
2929
run: |

.github/workflows/nv-inference.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -22,10 +22,10 @@ concurrency:
2222

2323
jobs:
2424
unit-tests:
25-
runs-on: [self-hosted, nvidia, cu116, v100]
25+
runs-on: [self-hosted, nvidia, cu117, v100]
2626

2727
steps:
28-
- uses: actions/checkout@v3
28+
- uses: actions/checkout@v4
2929

3030
- id: setup-venv
3131
uses: ./.github/workflows/setup-venv

.github/workflows/nv-mii.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -27,10 +27,10 @@ concurrency:
2727

2828
jobs:
2929
unit-tests:
30-
runs-on: [self-hosted, nvidia, cu116, v100]
30+
runs-on: [self-hosted, nvidia, cu117, v100]
3131

3232
steps:
33-
- uses: actions/checkout@v3
33+
- uses: actions/checkout@v4
3434

3535
- id: setup-venv
3636
uses: ./.github/workflows/setup-venv

0 commit comments

Comments
 (0)