File tree Expand file tree Collapse file tree 2 files changed +10
-2
lines changed Expand file tree Collapse file tree 2 files changed +10
-2
lines changed Original file line number Diff line number Diff line change @@ -30,7 +30,6 @@ seq_len = 4096
30
30
warmup_steps = 200 # lr scheduler warm up
31
31
max_norm = 1.0 # grad norm clipping
32
32
steps = 1000
33
- # only dp would be sufficient for 7B
34
33
data_parallel_degree = -1
35
34
# 8-way TP; adjust to 2 or 4 for local (single-host) runs
36
35
tensor_parallel_degree = 8
@@ -41,3 +40,8 @@ checkpoint_interval = 3600
41
40
checkpoint_interval_type = " steps"
42
41
checkpoint_folder = " "
43
42
dataset = " openwebtext"
43
+
44
+
45
+ [activation_checkpoint ]
46
+ mode = ' selective' # ['none', 'full', 'selective']
47
+ selective_ac_option = ' op' # either a positive integer N (apply AC to every N-th layer) or 'op' (apply AC based on the ops policy)
Original file line number Diff line number Diff line change @@ -30,7 +30,6 @@ seq_len = 4096
30
30
warmup_steps = 200 # lr scheduler warm up
31
31
max_norm = 1.0 # grad norm clipping
32
32
steps = 1000
33
- # only dp would be sufficient for 7B
34
33
data_parallel_degree = -1
35
34
# 8-way TP
36
35
tensor_parallel_degree = 8
@@ -41,3 +40,8 @@ checkpoint_interval = 3600
41
40
checkpoint_interval_type = " steps"
42
41
checkpoint_folder = " "
43
42
dataset = " openwebtext"
43
+
44
+
45
+ [activation_checkpoint ]
46
+ mode = ' selective' # ['none', 'full', 'selective']
47
+ selective_ac_option = ' 2' # either a positive integer N (apply AC to every N-th layer) or 'op' (apply AC based on the ops policy)
You can’t perform that action at this time.
0 commit comments