|
20 | 20 | except ModuleNotFoundError:
|
21 | 21 | import tomli as tomllib
|
22 | 22 |
|
| 23 | +test_with_rocm = os.getenv("TEST_WITH_ROCM", "0") |
| 24 | + |
23 | 25 |
|
24 | 26 | @dataclass
|
25 | 27 | class OverrideDefinitions:
|
@@ -139,28 +141,34 @@ def build_test_list():
|
139 | 141 | "Checkpoint Integration Test - Save Model Weights Only bf16",
|
140 | 142 | "model_weights_only_bf16",
|
141 | 143 | ),
|
142 |
| - OverrideDefinitions( |
143 |
| - [ |
144 |
| - [ |
145 |
| - "--parallelism.pipeline_parallel_degree 4", |
146 |
| - "--parallelism.pipeline_parallel_schedule InterleavedZeroBubble", |
| 144 | + ] |
| 145 | + # check test_with_rocm |
| 146 | + if test_with_rocm != "1": |
| 147 | + integration_tests_flavors["debug_model.toml"].extend([ |
| 148 | + OverrideDefinitions( |
| 149 | + [ |
| 150 | + [ |
| 151 | + "--parallelism.pipeline_parallel_degree 4", |
| 152 | + "--parallelism.pipeline_parallel_schedule InterleavedZeroBubble", |
| 153 | + ], |
147 | 154 | ],
|
148 |
| - ], |
149 |
| - "PP looped zero bubble test", |
150 |
| - "pp_looped_zero_bubble", |
151 |
| - ngpu=4, |
152 |
| - ), |
153 |
| - OverrideDefinitions( |
154 |
| - [ |
155 |
| - [ |
156 |
| - "--parallelism.pipeline_parallel_degree 2", |
157 |
| - "--parallelism.pipeline_parallel_schedule ZBVZeroBubble", |
| 155 | + "PP looped zero bubble test", |
| 156 | + "pp_looped_zero_bubble", |
| 157 | + ngpu=4, |
| 158 | + ), |
| 159 | + OverrideDefinitions( |
| 160 | + [ |
| 161 | + [ |
| 162 | + "--parallelism.pipeline_parallel_degree 2", |
| 163 | + "--parallelism.pipeline_parallel_schedule ZBVZeroBubble", |
| 164 | + ], |
158 | 165 | ],
|
159 |
| - ], |
160 |
| - "PP zero bubble test (v shaped)", |
161 |
| - "pp_zbv", |
162 |
| - ngpu=2, |
163 |
| - ), |
| 166 | + "PP zero bubble test (v shaped)", |
| 167 | + "pp_zbv", |
| 168 | + ngpu=2, |
| 169 | + ), |
| 170 | + ]) |
| 171 | + integration_tests_flavors["debug_model.toml"].extend([ |
164 | 172 | OverrideDefinitions(
|
165 | 173 | [
|
166 | 174 | [
|
@@ -272,18 +280,24 @@ def build_test_list():
|
272 | 280 | "pp_looped_1f1b",
|
273 | 281 | ngpu=4,
|
274 | 282 | ),
|
275 |
| - OverrideDefinitions( |
276 |
| - [ |
277 |
| - [ |
278 |
| - "--parallelism.pipeline_parallel_degree 2", |
279 |
| - "--parallelism.pipeline_parallel_schedule PipelineScheduleMulti", |
280 |
| - "--parallelism.pipeline_parallel_schedule_csv ./tests/assets/custom_schedule.csv", |
| 283 | + ]) |
| 284 | + # check test_with_rocm |
| 285 | + if test_with_rocm != "1": |
| 286 | + integration_tests_flavors["debug_model.toml"].extend([ |
| 287 | + OverrideDefinitions( |
| 288 | + [ |
| 289 | + [ |
| 290 | + "--parallelism.pipeline_parallel_degree 2", |
| 291 | + "--parallelism.pipeline_parallel_schedule PipelineScheduleMulti", |
| 292 | + "--parallelism.pipeline_parallel_schedule_csv ./tests/assets/custom_schedule.csv", |
| 293 | + ], |
281 | 294 | ],
|
282 |
| - ], |
283 |
| - "PP with custom pipeline schedule loaded from CSV file", |
284 |
| - "pp_custom_csv", |
285 |
| - ngpu=2, |
286 |
| - ), |
| 295 | + "PP with custom pipeline schedule loaded from CSV file", |
| 296 | + "pp_custom_csv", |
| 297 | + ngpu=2, |
| 298 | + ), |
| 299 | + ]) |
| 300 | + integration_tests_flavors["debug_model.toml"].extend([ |
287 | 301 | OverrideDefinitions(
|
288 | 302 | [
|
289 | 303 | [
|
@@ -494,7 +508,7 @@ def build_test_list():
|
494 | 508 | "Float8 emulation test",
|
495 | 509 | "float8_emulation",
|
496 | 510 | ),
|
497 |
| - ] |
| 511 | + ]) |
498 | 512 | return integration_tests_flavors
|
499 | 513 |
|
500 | 514 |
|
|
0 commit comments