Skip to content

Commit d322ff8

Browse files
authored
Merge pull request #6330 from flybird11111/main
[release] release version
2 parents ddbbbaa + 4afff92 commit d322ff8

29 files changed

+43
-43
lines changed

.cuda_ext.json

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -2,11 +2,11 @@
22
"build": [
33
{
44
"torch_command": "pip install torch==2.3.0 torchvision==0.18.0 torchaudio==2.3.0 --index-url https://download.pytorch.org/whl/cu121",
5-
"cuda_image": "hpcaitech/cuda-conda:12.1"
5+
"cuda_image": "image-cloud.luchentech.com/hpcaitech/cuda-conda:12.1"
66
},
77
{
88
"torch_command": "pip install torch==2.5.1 torchvision==0.20.1 torchaudio==2.5.1 --index-url https://download.pytorch.org/whl/cu124",
9-
"cuda_image": "hpcaitech/cuda-conda:12.4"
9+
"cuda_image": "image-cloud.luchentech.com/hpcaitech/cuda-conda:12.4"
1010
}
1111
]
1212
}

.github/workflows/build_on_schedule.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@ jobs:
1212
if: github.repository == 'hpcaitech/ColossalAI'
1313
runs-on: [self-hosted, gpu]
1414
container:
15-
image: hpcaitech/pytorch-cuda:2.2.2-12.1.0
15+
image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0
1616
options: --gpus all --rm -v /dev/shm -v /data/scratch/:/data/scratch/
1717
timeout-minutes: 90
1818
steps:

.github/workflows/close_inactive.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@ on:
77
jobs:
88
close-issues:
99
if: github.event.pull_request.draft == false && github.base_ref == 'main' && github.event.pull_request.base.repo.full_name == 'hpcaitech/ColossalAI'
10-
runs-on: ubuntu-latest
10+
runs-on: [self-hosted, ubuntu-latest]
1111
permissions:
1212
issues: write
1313
pull-requests: write

.github/workflows/compatiblity_test_on_dispatch.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ on:
1515
jobs:
1616
matrix_preparation:
1717
name: Prepare Container List
18-
runs-on: ubuntu-latest
18+
runs-on: [self-hosted, ubuntu-latest]
1919
outputs:
2020
matrix: ${{ steps.set-matrix.outputs.matrix }}
2121
steps:
@@ -31,7 +31,7 @@ jobs:
3131
do
3232
for cv in $CUDA_VERSIONS
3333
do
34-
DOCKER_IMAGE+=("\"hpcaitech/pytorch-cuda:${tv}-${cv}\"")
34+
DOCKER_IMAGE+=("\"image-cloud.luchentech.com/hpcaitech/pytorch-cuda:${tv}-${cv}\"")
3535
done
3636
done
3737
@@ -44,7 +44,7 @@ jobs:
4444
name: Test for PyTorch Compatibility
4545
needs: matrix_preparation
4646
if: github.repository == 'hpcaitech/ColossalAI'
47-
runs-on: [self-hosted, 8-gpu]
47+
runs-on: [self-hosted, ubuntu-latest]
4848
strategy:
4949
fail-fast: false
5050
matrix: ${{fromJson(needs.matrix_preparation.outputs.matrix)}}

.github/workflows/compatiblity_test_on_pr.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -9,7 +9,7 @@ on:
99
jobs:
1010
matrix_preparation:
1111
name: Prepare Container List
12-
runs-on: ubuntu-latest
12+
runs-on: [self-hosted, ubuntu-latest]
1313
outputs:
1414
matrix: ${{ steps.set-matrix.outputs.matrix }}
1515
concurrency:
@@ -23,7 +23,7 @@ jobs:
2323
DOCKER_IMAGE=()
2424
2525
while read tag; do
26-
DOCKER_IMAGE+=("\"hpcaitech/pytorch-cuda:${tag}\"")
26+
DOCKER_IMAGE+=("\"image-cloud.luchentech.com/hpcaitech/pytorch-cuda:${tag}\"")
2727
done <.compatibility
2828
2929
container=$( IFS=',' ; echo "${DOCKER_IMAGE[*]}" )
@@ -35,7 +35,7 @@ jobs:
3535
name: Test for PyTorch Compatibility
3636
needs: matrix_preparation
3737
if: github.repository == 'hpcaitech/ColossalAI'
38-
runs-on: [self-hosted, 8-gpu]
38+
runs-on: [self-hosted, ubuntu-latest]
3939
strategy:
4040
fail-fast: false
4141
matrix: ${{fromJson(needs.matrix_preparation.outputs.matrix)}}

.github/workflows/compatiblity_test_on_schedule.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -9,7 +9,7 @@ on:
99
jobs:
1010
matrix_preparation:
1111
name: Prepare Container List
12-
runs-on: ubuntu-latest
12+
runs-on: [self-hosted, ubuntu-latest]
1313
outputs:
1414
matrix: ${{ steps.set-matrix.outputs.matrix }}
1515
steps:
@@ -20,7 +20,7 @@ jobs:
2020
DOCKER_IMAGE=()
2121
2222
while read tag; do
23-
DOCKER_IMAGE+=("\"hpcaitech/pytorch-cuda:${tag}\"")
23+
DOCKER_IMAGE+=("\"image-cloud.luchentech.com/hpcaitech/pytorch-cuda:${tag}\"")
2424
done <.compatibility
2525
2626
container=$( IFS=',' ; echo "${DOCKER_IMAGE[*]}" )
@@ -32,7 +32,7 @@ jobs:
3232
name: Test for PyTorch Compatibility
3333
needs: matrix_preparation
3434
if: github.repository == 'hpcaitech/ColossalAI'
35-
runs-on: [self-hosted, 8-gpu]
35+
runs-on: [self-hosted, ubuntu-latest]
3636
strategy:
3737
fail-fast: false
3838
matrix: ${{fromJson(needs.matrix_preparation.outputs.matrix)}}

.github/workflows/cuda_ext_check_before_merge.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@ jobs:
1010
matrix_preparation:
1111
name: Prepare Container List
1212
if: github.repository == 'hpcaitech/ColossalAI'
13-
runs-on: ubuntu-latest
13+
runs-on: [self-hosted,ubuntu-latest]
1414
outputs:
1515
matrix: ${{ steps.set-matrix.outputs.matrix }}
1616
steps:
@@ -24,7 +24,7 @@ jobs:
2424
build:
2525
name: Release bdist wheels
2626
needs: matrix_preparation
27-
runs-on: [self-hosted, gpu]
27+
runs-on: [self-hosted, ubuntu-latest]
2828
strategy:
2929
fail-fast: false
3030
matrix: ${{fromJson(needs.matrix_preparation.outputs.matrix)}}

.github/workflows/doc_build_on_schedule_after_release.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@ jobs:
1111
build-doc:
1212
name: Trigger Documentation Build Workflow
1313
if: github.repository == 'hpcaitech/ColossalAI'
14-
runs-on: ubuntu-latest
14+
runs-on: [self-hosted, ubuntu-latest]
1515
steps:
1616
- name: trigger workflow in ColossalAI-Documentation
1717
run: |

.github/workflows/doc_check_on_pr.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ jobs:
1515
if: |
1616
github.event.pull_request.draft == false &&
1717
github.event.pull_request.base.repo.full_name == 'hpcaitech/ColossalAI'
18-
runs-on: ubuntu-latest
18+
runs-on: [self-hosted, ubuntu-latest]
1919
concurrency:
2020
group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}-check-i18n
2121
cancel-in-progress: true
@@ -33,7 +33,7 @@ jobs:
3333
if: |
3434
github.event.pull_request.draft == false &&
3535
github.event.pull_request.base.repo.full_name == 'hpcaitech/ColossalAI'
36-
runs-on: ubuntu-latest
36+
runs-on: [self-hosted, ubuntu-latest]
3737
concurrency:
3838
group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}-check-doc
3939
cancel-in-progress: true

.github/workflows/doc_test_on_pr.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ jobs:
1515
if: |
1616
github.event.pull_request.draft == false &&
1717
github.event.pull_request.base.repo.full_name == 'hpcaitech/ColossalAI' && github.event_name == 'pull_request'
18-
runs-on: ubuntu-latest
18+
runs-on: [self-hosted, ubuntu-latest]
1919
outputs:
2020
any_changed: ${{ steps.changed-files.outputs.any_changed }}
2121
changed_files: ${{ steps.changed-files.outputs.all_changed_files }}
@@ -56,7 +56,7 @@ jobs:
5656
needs: detect-changed-doc
5757
runs-on: [self-hosted, gpu]
5858
container:
59-
image: hpcaitech/pytorch-cuda:2.2.2-12.1.0
59+
image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0
6060
options: --gpus all --rm
6161
timeout-minutes: 30
6262
defaults:

.github/workflows/doc_test_on_schedule.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@ jobs:
1212
name: Test the changed Doc
1313
runs-on: [self-hosted, gpu]
1414
container:
15-
image: hpcaitech/pytorch-cuda:2.2.2-12.1.0
15+
image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0
1616
options: --gpus all --rm
1717
timeout-minutes: 60
1818
steps:

.github/workflows/draft_github_release_post_after_merge.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@ jobs:
1212
release:
1313
name: Draft Release Post
1414
if: ( github.event_name == 'workflow_dispatch' || github.event.pull_request.merged == true ) && github.repository == 'hpcaitech/ColossalAI'
15-
runs-on: ubuntu-latest
15+
runs-on: [self-hosted, ubuntu-latest]
1616
steps:
1717
- uses: actions/checkout@v2
1818
with:

.github/workflows/example_check_on_dispatch.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@ jobs:
1414
github.base_ref == 'main' &&
1515
github.event.pull_request.base.repo.full_name == 'hpcaitech/ColossalAI'
1616
name: Check the examples user want
17-
runs-on: ubuntu-latest
17+
runs-on: [self-hosted, ubuntu-latest]
1818
outputs:
1919
matrix: ${{ steps.set-matrix.outputs.matrix }}
2020
steps:
@@ -45,7 +45,7 @@ jobs:
4545
fail-fast: false
4646
matrix: ${{fromJson(needs.manual_check_matrix_preparation.outputs.matrix)}}
4747
container:
48-
image: hpcaitech/pytorch-cuda:2.2.2-12.1.0
48+
image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0
4949
options: --gpus all --rm -v /data/scratch/examples-data:/data/ -v /dev/shm
5050
timeout-minutes: 15
5151
steps:

.github/workflows/example_check_on_pr.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@ jobs:
1717
if: |
1818
github.event.pull_request.draft == false &&
1919
github.event.pull_request.base.repo.full_name == 'hpcaitech/ColossalAI' && github.event_name == 'pull_request'
20-
runs-on: ubuntu-latest
20+
runs-on: [self-hosted, ubuntu-latest]
2121
outputs:
2222
matrix: ${{ steps.setup-matrix.outputs.matrix }}
2323
anyChanged: ${{ steps.setup-matrix.outputs.anyChanged }}
@@ -90,7 +90,7 @@ jobs:
9090
fail-fast: false
9191
matrix: ${{fromJson(needs.detect-changed-example.outputs.matrix)}}
9292
container:
93-
image: hpcaitech/pytorch-cuda:2.2.2-12.1.0
93+
image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0
9494
options: --gpus all --rm -v /data/scratch/examples-data:/data/ -v /dev/shm
9595
timeout-minutes: 30
9696
concurrency:

.github/workflows/example_check_on_schedule.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@ jobs:
1010
matrix_preparation:
1111
if: github.repository == 'hpcaitech/ColossalAI'
1212
name: Prepare matrix for weekly check
13-
runs-on: ubuntu-latest
13+
runs-on: [self-hosted, ubuntu-latest]
1414
outputs:
1515
matrix: ${{ steps.setup-matrix.outputs.matrix }}
1616
steps:
@@ -34,7 +34,7 @@ jobs:
3434
fail-fast: false
3535
matrix: ${{fromJson(needs.matrix_preparation.outputs.matrix)}}
3636
container:
37-
image: hpcaitech/pytorch-cuda:2.2.2-12.1.0
37+
image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0
3838
options: --gpus all --rm -v /data/scratch/examples-data:/data/ -v /dev/shm
3939
timeout-minutes: 30
4040
steps:

.github/workflows/release_docker_after_publish.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -46,7 +46,7 @@ jobs:
4646
notify:
4747
name: Notify Lark via webhook
4848
needs: release
49-
runs-on: ubuntu-latest
49+
runs-on: [self-hosted, ubuntu-latest]
5050
if: ${{ always() }}
5151
steps:
5252
- uses: actions/checkout@v2

.github/workflows/release_nightly_on_schedule.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -9,7 +9,7 @@ jobs:
99
publish:
1010
if: github.repository == 'hpcaitech/ColossalAI'
1111
name: Build and publish Python 🐍 distributions 📦 to PyPI
12-
runs-on: ubuntu-latest
12+
runs-on: [self-hosted, ubuntu-latest]
1313
timeout-minutes: 20
1414
outputs:
1515
status: ${{ steps.publish.outcome }}
@@ -36,7 +36,7 @@ jobs:
3636
notify:
3737
name: Notify Lark via webhook
3838
needs: publish
39-
runs-on: ubuntu-latest
39+
runs-on: [self-hosted, ubuntu-latest]
4040
if: ${{ always() }} && github.repository == 'hpcaitech/ColossalAI'
4141
steps:
4242
- uses: actions/checkout@v2

.github/workflows/release_pypi_after_merge.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@ jobs:
1212
build-n-publish:
1313
if: github.event_name == 'workflow_dispatch' || github.repository == 'hpcaitech/ColossalAI' && github.event.pull_request.merged == true && github.base_ref == 'main'
1414
name: Build and publish Python 🐍 distributions 📦 to PyPI
15-
runs-on: ubuntu-latest
15+
runs-on: [self-hosted, ubuntu-latest]
1616
timeout-minutes: 20
1717
steps:
1818
- uses: actions/checkout@v2
@@ -35,7 +35,7 @@ jobs:
3535
notify:
3636
name: Notify Lark via webhook
3737
needs: build-n-publish
38-
runs-on: ubuntu-latest
38+
runs-on: [self-hosted, ubuntu-latest]
3939
if: ${{ always() }}
4040
steps:
4141
- uses: actions/checkout@v2

.github/workflows/release_test_pypi_before_merge.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -9,7 +9,7 @@ jobs:
99
build-n-publish:
1010
if: github.event_name == 'workflow_dispatch' || github.repository == 'hpcaitech/ColossalAI'
1111
name: Build and publish Python 🐍 distributions 📦 to Test PyPI
12-
runs-on: ubuntu-latest
12+
runs-on: [self-hosted, ubuntu-latest]
1313
timeout-minutes: 20
1414
steps:
1515
- uses: actions/checkout@v2

.github/workflows/report_leaderboard_to_lark.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@ jobs:
1010
generate-and-publish:
1111
if: github.repository == 'hpcaitech/ColossalAI'
1212
name: Generate leaderboard report and publish to Lark
13-
runs-on: ubuntu-latest
13+
runs-on: [self-hosted, ubuntu-latest]
1414
timeout-minutes: 20
1515
steps:
1616
- uses: actions/checkout@v2

.github/workflows/report_test_coverage.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,7 @@ on:
88

99
jobs:
1010
report-test-coverage:
11-
runs-on: ubuntu-latest
11+
runs-on: [self-hosted, ubuntu-latest]
1212
if: ${{ github.event.workflow_run.conclusion == 'success' }}
1313
steps:
1414
- name: "Download artifact"

.github/workflows/run_chatgpt_examples.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,7 @@ jobs:
1919
github.event.pull_request.base.repo.full_name == 'hpcaitech/ColossalAI'
2020
runs-on: [self-hosted, gpu]
2121
container:
22-
image: hpcaitech/pytorch-cuda:2.2.2-12.1.0
22+
image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0
2323
options: --gpus all --rm -v /data/scratch/examples-data:/data/scratch/examples-data --shm-size=10.24gb
2424
timeout-minutes: 60
2525
defaults:

.github/workflows/run_chatgpt_unit_tests.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,7 @@ jobs:
1919
github.event.pull_request.base.repo.full_name == 'hpcaitech/ColossalAI'
2020
runs-on: [self-hosted, gpu]
2121
container:
22-
image: hpcaitech/pytorch-cuda:2.2.2-12.1.0
22+
image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0
2323
options: --gpus all --rm -v /data/scratch/examples-data:/data/scratch/examples-data
2424
timeout-minutes: 30
2525
defaults:

.github/workflows/run_colossalqa_unit_tests.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,7 @@ jobs:
1919
github.event.pull_request.base.repo.full_name == 'hpcaitech/ColossalAI'
2020
runs-on: [self-hosted, gpu]
2121
container:
22-
image: hpcaitech/pytorch-cuda:2.2.2-12.1.0
22+
image: image-cloud.luchentech.com/hpcaitech/pytorch-cuda:2.2.2-12.1.0
2323
volumes:
2424
- /data/scratch/test_data_colossalqa:/data/scratch/test_data_colossalqa
2525
- /data/scratch/llama-tiny:/data/scratch/llama-tiny

.github/workflows/submodule.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@ on:
77

88
jobs:
99
sync-submodule:
10-
runs-on: ubuntu-latest
10+
runs-on: [self-hosted, ubuntu-latest]
1111
if: github.repository == 'hpcaitech/ColossalAI'
1212
steps:
1313
- name: Checkout

.github/workflows/translate_comment.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@ on:
77

88
jobs:
99
build:
10-
runs-on: ubuntu-latest
10+
runs-on: [self-hosted, ubuntu-latest]
1111
steps:
1212
- uses: usthe/issues-translate-action@v2.7
1313
with:

tests/kit/model_zoo/transformers/gpt.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -113,6 +113,7 @@ def date_gen_for_double_heads():
113113
problem_type="single_label_classification",
114114
pad_token_id=1022,
115115
tie_word_embeddings=True,
116+
attn_implementation="eager",
116117
)
117118

118119
config_for_token_classification = copy.deepcopy(config)

tests/test_zero/test_gemini/test_inference.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -114,7 +114,6 @@ def run_dist(rank, world_size, port):
114114
exam_inference()
115115

116116

117-
@pytest.mark.skip("this test failed")
118117
@pytest.mark.dist
119118
@pytest.mark.parametrize("world_size", [1, 4])
120119
def test_inference(world_size):

version.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
0.4.9
1+
0.5.0

0 commit comments

Comments
 (0)