Skip to content

Commit 3469f9c

Browse files
authored
Merge branch 'main' into feature/torchtitan/add-deepseek-model
2 parents fe44824 + c69ee12 commit 3469f9c

18 files changed: +70 −16 lines changed

examples/torchtitan/configs/MI300X/llama3.1_405B-pretrain.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
work_group: ${PRIMUS_TEAM:amd}
22
user_name: ${PRIMUS_USER:root}
3-
exp_name: ${PRIMUS_EXP_NAME:llama3_405B-pretrain}
3+
exp_name: ${PRIMUS_EXP_NAME:llama3.1_405B-pretrain}
44
workspace: ./output
55

66
modules:

examples/torchtitan/configs/MI300X/llama3.1_70B-BF16-pretrain.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
work_group: ${PRIMUS_TEAM:amd}
22
user_name: ${PRIMUS_USER:root}
3-
exp_name: ${PRIMUS_EXP_NAME:llama3_70B-pretrain}
3+
exp_name: ${PRIMUS_EXP_NAME:llama3.1_70B-pretrain}
44
workspace: ./output
55

66
modules:

examples/torchtitan/configs/MI300X/llama3.1_70B-FP8-pretrain.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
work_group: ${PRIMUS_TEAM:amd}
22
user_name: ${PRIMUS_USER:root}
3-
exp_name: ${PRIMUS_EXP_NAME:llama3_70B-pretrain}
3+
exp_name: ${PRIMUS_EXP_NAME:llama3.1_70B-pretrain}
44
workspace: ./output
55

66
modules:

examples/torchtitan/configs/MI300X/llama3.1_8B-BF16-pretrain.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
work_group: ${PRIMUS_TEAM:amd}
22
user_name: ${PRIMUS_USER:root}
3-
exp_name: ${PRIMUS_EXP_NAME:llama3_8B-pretrain}
3+
exp_name: ${PRIMUS_EXP_NAME:llama3.1_8B-pretrain}
44
workspace: ./output
55

66
modules:

examples/torchtitan/configs/MI300X/llama3.1_8B-FP8-pretrain.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
work_group: ${PRIMUS_TEAM:amd}
22
user_name: ${PRIMUS_USER:root}
3-
exp_name: ${PRIMUS_EXP_NAME:llama3_8B-pretrain}
3+
exp_name: ${PRIMUS_EXP_NAME:llama3.1_8B-pretrain}
44
workspace: ./output
55

66
modules:

primus/configs/models/megatron/llama3_70B.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@ bases:
22
- llama3_base.yaml
33

44
tokenizer_type: Llama3Tokenizer
5-
tokenizer_model: meta-llama/Llama-3.1-70B
5+
tokenizer_model: meta-llama/Meta-Llama-3-70B
66

77
ffn_hidden_size: 28672
88
hidden_size: 8192

primus/configs/models/megatron/llama3_8B.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@ bases:
22
- llama3_base.yaml
33

44
tokenizer_type: Llama3Tokenizer
5-
tokenizer_model: meta-llama/Llama-3.1-8B
5+
tokenizer_model: meta-llama/Meta-Llama-3-8B
66

77

88
ffn_hidden_size: 14336

primus/configs/models/torchtitan/llama3.1_405B.yaml

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -5,5 +5,4 @@ job:
55
model:
66
name: "llama3"
77
flavor: "405B"
8-
hf_assets_path: "meta-llama/Llama-3.1-8B"
9-
# converters = ["float8"]
8+
hf_assets_path: "meta-llama/Llama-3.1-405B"

primus/configs/models/torchtitan/llama3.1_70B-fp8.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
job:
22
dump_folder: "./outputs"
3-
description: "Llama 3 70B training"
3+
description: "Llama 3.1 70B training"
44

55
model:
66
name: "llama3"
Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,9 +1,8 @@
11
job:
22
dump_folder: "./outputs"
3-
description: "Llama 3 70B training"
3+
description: "Llama 3.1 70B training"
44

55
model:
66
name: "llama3"
77
flavor: "70B"
8-
hf_assets_path: "meta-llama/Llama-3.1-8B"
9-
# converters = ["float8"]
8+
hf_assets_path: "meta-llama/Llama-3.1-70B"

0 commit comments

Comments (0)