Skip to content

Commit 7a1cfa2

Browse files
Merge branch 'main' into lcalabri/ci_test_lang_mod_eager_lazy
2 parents 51e97a1 + 4842376 commit 7a1cfa2

File tree

118 files changed

+10830
-866
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

118 files changed

+10830
-866
lines changed

.github/workflows/fast_tests.yml

+10-4
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ concurrency:
1515
jobs:
1616
transformers:
1717
name: Run tests for optimum.habana.transformers
18-
runs-on: [self-hosted, linux, x64, gaudi2]
18+
runs-on: [self-hosted, linux, x64, gaudi2, fast]
1919
steps:
2020
- name: Checkout
2121
uses: actions/checkout@v2
@@ -25,19 +25,22 @@ jobs:
2525
- name: Run tests
2626
run: |
2727
docker run \
28+
--rm \
2829
-v $PWD:/root/workspace \
30+
-v /scratch-1:/data \
2931
--workdir=/root/workspace \
3032
--runtime=habana \
31-
-e HABANA_VISIBLE_DEVICES=all \
33+
-e HABANA_VISIBLE_DEVICES=$DOCKER_HABANA_VISIBLE_DEVICES \
3234
-e OMPI_MCA_btl_vader_single_copy_mechanism=none \
35+
-e HF_HOME=/data \
3336
--cap-add=sys_nice \
3437
--net=host \
3538
--ipc=host \
3639
vault.habana.ai/gaudi-docker/1.18.0/ubuntu22.04/habanalabs/pytorch-installer-2.4.0:latest \
3740
/bin/bash tests/ci/fast_tests.sh
3841
diffusers:
3942
name: Run tests for optimum.habana.diffusers
40-
runs-on: [self-hosted, linux, x64, gaudi2]
43+
runs-on: [self-hosted, linux, x64, gaudi2, fast]
4144
steps:
4245
- name: Checkout
4346
uses: actions/checkout@v2
@@ -47,11 +50,14 @@ jobs:
4750
- name: Run tests
4851
run: |
4952
docker run \
53+
--rm \
5054
-v $PWD:/root/workspace \
55+
-v /scratch-1:/data \
5156
--workdir=/root/workspace \
5257
--runtime=habana \
53-
-e HABANA_VISIBLE_DEVICES=all \
58+
-e HABANA_VISIBLE_DEVICES=$DOCKER_HABANA_VISIBLE_DEVICES \
5459
-e OMPI_MCA_btl_vader_single_copy_mechanism=none \
60+
-e HF_HOME=/data \
5561
--cap-add=sys_nice \
5662
--net=host \
5763
--ipc=host \

.github/workflows/slow_tests_gaudi2.yml

+34-8
Original file line numberDiff line numberDiff line change
@@ -9,9 +9,35 @@ concurrency:
99
group: ${{ github.workflow }}
1010

1111
jobs:
12+
example-diff:
13+
name: Test examples differences
14+
runs-on: [self-hosted, linux, x64, gaudi2, nightly]
15+
steps:
16+
- name: Checkout
17+
uses: actions/checkout@v2
18+
- name: Pull image
19+
run: |
20+
docker pull vault.habana.ai/gaudi-docker/1.18.0/ubuntu22.04/habanalabs/pytorch-installer-2.4.0:latest
21+
- name: Run tests
22+
run: |
23+
docker run \
24+
--rm \
25+
-v $PWD:/root/workspace \
26+
--workdir=/root/workspace \
27+
--runtime=habana \
28+
-e HABANA_VISIBLE_DEVICES=all \
29+
-e OMPI_MCA_btl_vader_single_copy_mechanism=none \
30+
--cap-add=sys_nice \
31+
--net=host \
32+
--ipc=host \
33+
vault.habana.ai/gaudi-docker/1.18.0/ubuntu22.04/habanalabs/pytorch-installer-2.4.0:latest \
34+
/bin/bash tests/ci/example_diff_tests.sh
1235
stable-diffusion:
1336
name: Test Stable Diffusion
14-
runs-on: [self-hosted, linux, x64, gaudi2]
37+
if: ${{ !cancelled() && (success() || failure()) }}
38+
needs:
39+
- example-diff # run the job when the previous test job is done
40+
runs-on: [self-hosted, linux, x64, gaudi2, nightly]
1541
steps:
1642
- name: Checkout
1743
uses: actions/checkout@v2
@@ -40,7 +66,7 @@ jobs:
4066
if: ${{ !cancelled() && (success() || failure()) }}
4167
needs:
4268
- stable-diffusion # run the job when the previous test job is done
43-
runs-on: [self-hosted, linux, x64, gaudi2]
69+
runs-on: [self-hosted, linux, x64, gaudi2, nightly]
4470
steps:
4571
- name: Checkout
4672
uses: actions/checkout@v2
@@ -69,7 +95,7 @@ jobs:
6995
if: ${{ !cancelled() && (success() || failure()) }}
7096
needs:
7197
- deepspeed # run the job when the previous test job is done
72-
runs-on: [self-hosted, linux, x64, gaudi2]
98+
runs-on: [self-hosted, linux, x64, gaudi2, nightly]
7399
steps:
74100
- name: Checkout
75101
uses: actions/checkout@v2
@@ -98,7 +124,7 @@ jobs:
98124
if: ${{ !cancelled() && (success() || failure()) }}
99125
needs:
100126
- fsdp # run the job when the previous test job is done
101-
runs-on: [self-hosted, linux, x64, gaudi2]
127+
runs-on: [self-hosted, linux, x64, gaudi2, nightly]
102128
steps:
103129
- name: Checkout
104130
uses: actions/checkout@v2
@@ -128,7 +154,7 @@ jobs:
128154
needs:
129155
- deepspeed
130156
- multi-card # run the job when the previous test jobs are done
131-
runs-on: [self-hosted, linux, x64, gaudi2]
157+
runs-on: [self-hosted, linux, x64, gaudi2, nightly]
132158
steps:
133159
- name: Checkout
134160
uses: actions/checkout@v2
@@ -160,7 +186,7 @@ jobs:
160186
- deepspeed
161187
- multi-card
162188
- single-card # run the job when the previous test jobs are done
163-
runs-on: [self-hosted, linux, x64, gaudi2]
189+
runs-on: [self-hosted, linux, x64, gaudi2, nightly]
164190
steps:
165191
- name: Checkout
166192
uses: actions/checkout@v2
@@ -189,7 +215,7 @@ jobs:
189215
if: ${{ !cancelled() && (success() || failure()) }}
190216
needs:
191217
- text-generation
192-
runs-on: [self-hosted, linux, x64, gaudi2]
218+
runs-on: [self-hosted, linux, x64, gaudi2, nightly]
193219
steps:
194220
- name: Checkout
195221
uses: actions/checkout@v2
@@ -218,7 +244,7 @@ jobs:
218244
if: ${{ !cancelled() && (success() || failure()) }}
219245
needs:
220246
- trl
221-
runs-on: [self-hosted, linux, x64, gaudi2]
247+
runs-on: [self-hosted, linux, x64, gaudi2, nightly]
222248
steps:
223249
- name: Checkout Optimum Habana
224250
uses: actions/checkout@v2

README.md

+5
Original file line numberDiff line numberDiff line change
@@ -214,6 +214,7 @@ The following model architectures, tasks and device distributions have been vali
214214
| Qwen2 | <div style="text-align:left"><li>Single card</li></div> | <div style="text-align:left"><li>Single card</li></div> | <li>[language modeling](https://github.com/huggingface/optimum-habana/tree/main/examples/language-modeling)</li><li>[text generation](https://github.com/huggingface/optimum-habana/tree/main/examples/text-generation)</li> |
215215
| Qwen2-MoE | | <div style="text-align:left"><li>Single card</li></div> | <li>[text generation](https://github.com/huggingface/optimum-habana/tree/main/examples/text-generation)</li> |
216216
| Gemma | :heavy_check_mark: | <div style="text-align:left"><li>Single card</li></div> | <li>[language modeling](https://github.com/huggingface/optimum-habana/tree/main/examples/language-modeling)</li><li>[text generation](https://github.com/huggingface/optimum-habana/tree/main/examples/text-generation)</li> |
217+
| Gemma2 | | :heavy_check_mark: | <li>[text generation](https://github.com/huggingface/optimum-habana/tree/main/examples/text-generation)</li> |
217218
| XGLM | | <div style="text-align:left"><li>Single card</li></div> | <li>[text generation](https://github.com/huggingface/optimum-habana/tree/main/examples/text-generation)</li> |
218219
| Cohere | | <div style="text-align:left"><li>Single card</li></div> | <li>[text generation](https://github.com/huggingface/optimum-habana/tree/main/examples/text-generation)</li> |
219220
| T5 / Flan T5 | :heavy_check_mark: | :heavy_check_mark: | <li>[summarization](https://github.com/huggingface/optimum-habana/tree/main/examples/summarization)</li><li>[translation](https://github.com/huggingface/optimum-habana/tree/main/examples/translation)</li><li>[question answering](https://github.com/huggingface/optimum-habana/tree/main/examples/question-answering#fine-tuning-t5-on-squad20)</li> |
@@ -231,11 +232,14 @@ The following model architectures, tasks and device distributions have been vali
231232
| ClipSeg | | <div style="text-align:left"><li>Single card</li></div> | <li>[object segmentation](https://github.com/huggingface/optimum-habana/tree/main/examples/object-segementation)</li> |
232233
| Llava / Llava-next | | <div style="text-align:left"><li>Single card</li></div> | <li>[image to text](https://github.com/huggingface/optimum-habana/tree/main/examples/image-to-text)</li> |
233234
| idefics2 | <div style="text-align:left"><li>LoRA</li></div> | <div style="text-align:left"><li>Single card</li></div> | <li>[image to text](https://github.com/huggingface/optimum-habana/tree/main/examples/image-to-text)</li> |
235+
| Paligemma | | <div style="text-align:left"><li>Single card</li></div> | <li>[image to text](https://github.com/huggingface/optimum-habana/tree/main/examples/image-to-text)</li> |
234236
| Segment Anything Model | | <div style="text-align:left"><li>Single card</li></div> | <li>[object segmentation](https://github.com/huggingface/optimum-habana/tree/main/examples/object-segementation)</li> |
235237
| VideoMAE | | <div style="text-align:left"><li>Single card</li></div> | <li>[Video classification](https://github.com/huggingface/optimum-habana/tree/main/examples/video-classification)</li> |
236238
| TableTransformer | | <div style="text-align:left"><li>Single card</li></div> | <li>[table object detection](https://github.com/huggingface/optimum-habana/tree/main/examples/table-detection) </li> |
237239
| DETR | | <div style="text-align:left"><li>Single card</li></div> | <li>[object detection](https://github.com/huggingface/optimum-habana/tree/main/examples/object-detection)</li> |
238240
| Mllama | <div style="text-align:left"><li>LoRA</li></div> | :heavy_check_mark: | <li>[image to text](https://github.com/huggingface/optimum-habana/tree/main/examples/image-to-text)</li> |
241+
| MiniCPM3 | | <div style="text-align:left"><li>Single card</li></div> | <li>[text generation](https://github.com/huggingface/optimum-habana/tree/main/examples/text-generation)</li> |
242+
| Baichuan2 | | <div style="text-align:left"><li>Single card</li></div> | <li>[text generation](https://github.com/huggingface/optimum-habana/tree/main/examples/text-generation)</li> |
239243
240244
</div>
241245
@@ -249,6 +253,7 @@ The following model architectures, tasks and device distributions have been vali
249253
| Stable Diffusion XL | <li>[fine-tuning](https://github.com/huggingface/optimum-habana/tree/main/examples/stable-diffusion/training#fine-tuning-for-stable-diffusion-xl)</li> | <li>Single card</li> | <li>[text-to-image generation](https://github.com/huggingface/optimum-habana/tree/main/examples/stable-diffusion)</li> |
250254
| Stable Diffusion Depth2img | | <li>Single card</li> | <li>[depth-to-image generation](https://github.com/huggingface/optimum-habana/tree/main/examples/stable-diffusion)</li> |
251255
| LDM3D | | <li>Single card</li> | <li>[text-to-image generation](https://github.com/huggingface/optimum-habana/tree/main/examples/stable-diffusion)</li> |
256+
| FLUX.1 | <li>[fine-tuning](https://github.com/huggingface/optimum-habana/tree/main/examples/stable-diffusion/training#dreambooth-lora-fine-tuning-with-flux1-dev)</li> | <li>Single card</li> | <li>[text-to-image generation](https://github.com/huggingface/optimum-habana/tree/main/examples/stable-diffusion)</li> |
252257
| Text to Video | | <li>Single card</li> | <li>[text-to-video generation](https://github.com/huggingface/optimum-habana/tree/main/examples/text-to-video)</li> |
253258
254259
</div>

docs/source/_toctree.yml

+9-11
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
- sections:
22
- local: index
3-
title: 🤗 Optimum Habana
3+
title: 🤗 Optimum for Intel Gaudi
44
- local: installation
55
title: Installation
66
- local: quickstart
@@ -16,12 +16,14 @@
1616
title: Run Inference
1717
- local: tutorials/stable_diffusion
1818
title: Stable Diffusion
19-
- local: tutorials/stable_diffusion_ldm3d
20-
title: LDM3D
19+
- local: tutorials/tgi
20+
title: TGI on Gaudi
2121
title: Tutorials
2222
- sections:
2323
- local: usage_guides/overview
2424
title: Overview
25+
- local: usage_guides/script_adaptation
26+
title: Script Adaptation
2527
- local: usage_guides/pretraining
2628
title: Pretraining Transformers
2729
- local: usage_guides/accelerate_training
@@ -32,20 +34,16 @@
3234
title: How to use DeepSpeed
3335
- local: usage_guides/multi_node_training
3436
title: Multi-node Training
37+
- local: usage_guides/quantization
38+
title: Quantization
3539
title: How-To Guides
36-
- sections:
37-
- local: concept_guides/hpu
38-
title: What are Habana's Gaudi and HPUs?
39-
title: Conceptual Guides
4040
- sections:
4141
- local: package_reference/trainer
4242
title: Gaudi Trainer
4343
- local: package_reference/gaudi_config
4444
title: Gaudi Configuration
45-
- local: package_reference/stable_diffusion_pipeline
46-
title: Gaudi Stable Diffusion Pipeline
4745
- local: package_reference/distributed_runner
4846
title: Distributed Runner
4947
title: Reference
50-
title: Optimum Habana
51-
isExpanded: false
48+
title: Optimum for Intel Gaudi
49+
isExpanded: false

docs/source/concept_guides/hpu.mdx

-49
This file was deleted.

0 commit comments

Comments
 (0)