Skip to content

Commit 4d0c813

Browse files
cpgaffney1Orbax Authors
authored and committed
No public description
PiperOrigin-RevId: 886881258
1 parent 83804f6 commit 4d0c813

31 files changed

+1565
-23
lines changed

checkpoint/orbax/checkpoint/_src/testing/benchmarks/configs/evaluations/model_sizes/llama-405b.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -11,6 +11,7 @@ mesh_config:
1111
# The checkpoint configuration, shared across all generated benchmarks.
1212
checkpoint_config:
1313
path: "gs://orbax-benchmarks/checkpoints/llama-3.1-405B-checkpoints/0/items"
14+
sharding_config_path: "gs://orbax-benchmarks/sharding-configs/llama3.1-405b-v5p-128-data-1-fsdp-64-tensor-1/abstract_state.json"
1415

1516
benchmarks:
1617
- generator: "orbax.checkpoint._src.testing.benchmarks.v1.benchmark.Benchmark"

checkpoint/orbax/checkpoint/_src/testing/benchmarks/configs/evaluations/model_sizes/llama-70b.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -11,6 +11,7 @@ mesh_config:
1111
# The checkpoint configuration, shared across all generated benchmarks.
1212
checkpoint_config:
1313
path: "gs://orbax-benchmarks/checkpoints/llama-3.1-70B-checkpoints/0/items"
14+
sharding_config_path: "gs://orbax-benchmarks/sharding-configs/llama3.1-70b-v5p-32-data-1-fsdp-16-tensor-1/abstract_state.json"
1415

1516
benchmarks:
1617
- generator: "orbax.checkpoint._src.testing.benchmarks.v1.benchmark.Benchmark"
@@ -23,4 +24,3 @@ benchmarks:
2324
use_zarr3: true
2425
use_replica_parallel: false
2526
use_compression: true
26-
enable_trace: true

checkpoint/orbax/checkpoint/_src/testing/benchmarks/configs/evaluations/model_sizes/llama-8b.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -10,6 +10,7 @@ mesh_config:
1010
# The checkpoint configuration, shared across all generated benchmarks.
1111
checkpoint_config:
1212
path: "gs://orbax-benchmarks/checkpoints/llama-3.1-8B-checkpoints/0/items"
13+
sharding_config_path: "gs://orbax-benchmarks/sharding-configs/llama3.1-8b-v5p-8-data-1-fsdp-4-tensor-1/abstract_state.json"
1314

1415
benchmarks:
1516
- generator: "orbax.checkpoint._src.testing.benchmarks.v1.benchmark.Benchmark"
Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,26 @@
1+
# The name for the entire test suite run.
2+
# Assumes v5p-128 (64 chips)
3+
suite_name: "Llama 3.1 405B"
4+
num_repeats: 20
5+
6+
7+
mesh_config:
8+
mesh_axes: ["data", "fsdp", "tensor"]
9+
ici_parallelism: {"data": 1, "fsdp": 64, "tensor": 1}
10+
11+
# The checkpoint configuration, shared across all generated benchmarks.
12+
checkpoint_config:
13+
path: "gs://orbax-benchmarks/checkpoints/llama-405b_generate_1-64-1"
14+
sharding_config_path: "gs://orbax-benchmarks/sharding-configs/llama3.1-405b-v5p-128-data-1-fsdp-64-tensor-1/abstract_state.json"
15+
16+
benchmarks:
17+
- generator: "orbax.checkpoint._src.testing.benchmarks.v1.benchmark.Benchmark"
18+
options:
19+
# --- Generator Options ---
20+
# These keys must match the attributes of the `BenchmarkOptions` class
21+
# associated with the `Benchmark` generator.
22+
async_enabled: true
23+
use_ocdbt: true
24+
use_zarr3: true
25+
use_replica_parallel: false
26+
use_compression: true
Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,26 @@
1+
# The name for the entire test suite run.
2+
# Assumes v5p-32 (16 chips)
3+
suite_name: "Llama 3.1 70B"
4+
num_repeats: 20
5+
6+
7+
mesh_config:
8+
mesh_axes: ["data", "fsdp", "tensor"]
9+
ici_parallelism: {"data": 1, "fsdp": 16, "tensor": 1}
10+
11+
# The checkpoint configuration, shared across all generated benchmarks.
12+
checkpoint_config:
13+
path: "gs://orbax-benchmarks/checkpoints/llama-70b_generate_1-16-1"
14+
sharding_config_path: "gs://orbax-benchmarks/sharding-configs/llama3.1-70b-v5p-32-data-1-fsdp-16-tensor-1/abstract_state.json"
15+
16+
benchmarks:
17+
- generator: "orbax.checkpoint._src.testing.benchmarks.v1.benchmark.Benchmark"
18+
options:
19+
# --- Generator Options ---
20+
# These keys must match the attributes of the `BenchmarkOptions` class
21+
# associated with the `Benchmark` generator.
22+
async_enabled: true
23+
use_ocdbt: true
24+
use_zarr3: true
25+
use_replica_parallel: false
26+
use_compression: true
Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,25 @@
1+
# The name for the entire test suite run.
2+
# Assumes v5p-8 (4 chips)
3+
suite_name: "Llama 3.1 8B"
4+
num_repeats: 20
5+
6+
mesh_config:
7+
mesh_axes: ["data", "fsdp", "tensor"]
8+
ici_parallelism: {"data": 1, "fsdp": 4, "tensor": 1}
9+
10+
# The checkpoint configuration, shared across all generated benchmarks.
11+
checkpoint_config:
12+
path: "gs://orbax-benchmarks/checkpoints/llama-8b_generate_1-4-1"
13+
sharding_config_path: "gs://orbax-benchmarks/sharding-configs/llama3.1-8b-v5p-8-data-1-fsdp-4-tensor-1/abstract_state.json"
14+
15+
benchmarks:
16+
- generator: "orbax.checkpoint._src.testing.benchmarks.v1.benchmark.Benchmark"
17+
options:
18+
# --- Generator Options ---
19+
# These keys must match the attributes of the `BenchmarkOptions` class
20+
# associated with the `Benchmark` generator.
21+
async_enabled: true
22+
use_ocdbt: true
23+
use_zarr3: true
24+
use_replica_parallel: false
25+
use_compression: true
Lines changed: 27 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,27 @@
1+
# The name for the entire test suite run.
2+
# Assumes v5p-128 (64 chips)
3+
suite_name: "Llama 3.1 405B"
4+
num_repeats: 1
5+
6+
7+
mesh_config:
8+
mesh_axes: ["data", "fsdp", "tensor"]
9+
# Should match the mesh encoded in checkpoint_config.sharding_config_path.
10+
ici_parallelism: {"data": 1, "fsdp": 64, "tensor": 1}
11+
12+
# The checkpoint configuration, shared across all generated benchmarks.
13+
checkpoint_config:
14+
path: "gs://orbax-benchmarks/checkpoints/llama-3.1-405B-checkpoints/0/items"
15+
sharding_config_path: "gs://orbax-benchmarks/sharding-configs/llama3.1-405b-v5p-128-data-1-fsdp-64-tensor-1/abstract_state.json"
16+
17+
benchmarks:
18+
- generator: "orbax.checkpoint._src.testing.benchmarks.v1.benchmark.Benchmark"
19+
options:
20+
# --- Generator Options ---
21+
# These keys must match the attributes of the `BenchmarkOptions` class
22+
# associated with the `Benchmark` generator.
23+
async_enabled: true
24+
use_ocdbt: true
25+
use_zarr3: true
26+
use_replica_parallel: false
27+
use_compression: true
Lines changed: 27 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,27 @@
1+
# The name for the entire test suite run.
2+
# Assumes v5p-32 (16 chips)
3+
suite_name: "Llama 3.1 70B"
4+
num_repeats: 1
5+
6+
7+
mesh_config:
8+
mesh_axes: ["data", "fsdp", "tensor"]
9+
# Should match the mesh encoded in checkpoint_config.sharding_config_path.
10+
ici_parallelism: {"data": 1, "fsdp": 16, "tensor": 1}
11+
12+
# The checkpoint configuration, shared across all generated benchmarks.
13+
checkpoint_config:
14+
path: "gs://orbax-benchmarks/checkpoints/llama-3.1-70B-checkpoints/0/items"
15+
sharding_config_path: "gs://orbax-benchmarks/sharding-configs/llama3.1-70b-v5p-32-data-1-fsdp-16-tensor-1/abstract_state.json"
16+
17+
benchmarks:
18+
- generator: "orbax.checkpoint._src.testing.benchmarks.v1.benchmark.Benchmark"
19+
options:
20+
# --- Generator Options ---
21+
# These keys must match the attributes of the `BenchmarkOptions` class
22+
# associated with the `Benchmark` generator.
23+
async_enabled: true
24+
use_ocdbt: true
25+
use_zarr3: true
26+
use_replica_parallel: false
27+
use_compression: true
Lines changed: 27 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,27 @@
1+
# The name for the entire test suite run.
2+
# Assumes v5p-8 (4 chips)
3+
suite_name: "Llama 3.1 8B"
4+
num_repeats: 1
5+
6+
7+
mesh_config:
8+
mesh_axes: ["data", "fsdp", "tensor"]
9+
# Should match the mesh encoded in checkpoint_config.sharding_config_path.
10+
ici_parallelism: {"data": 1, "fsdp": 4, "tensor": 1}
11+
12+
# The checkpoint configuration, shared across all generated benchmarks.
13+
checkpoint_config:
14+
path: "gs://orbax-benchmarks/checkpoints/llama-3.1-8B-checkpoints/0/items"
15+
sharding_config_path: "gs://orbax-benchmarks/sharding-configs/llama3.1-8b-v5p-8-data-1-fsdp-4-tensor-1/abstract_state.json"
16+
17+
benchmarks:
18+
- generator: "orbax.checkpoint._src.testing.benchmarks.v1.benchmark.Benchmark"
19+
options:
20+
# --- Generator Options ---
21+
# These keys must match the attributes of the `BenchmarkOptions` class
22+
# associated with the `Benchmark` generator.
23+
async_enabled: true
24+
use_ocdbt: true
25+
use_zarr3: true
26+
use_replica_parallel: false
27+
use_compression: true

0 commit comments

Comments
 (0)