lm error
Browse files
balanced_bokmaal_nynorsk_lm_base.gin
CHANGED
|
@@ -12,7 +12,7 @@ MIXTURE_OR_TASK_NAME = "balanced_bokmaal_nynorsk_prefix_lm_stream"
|
|
| 12 |
TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
|
| 13 |
TRAIN_STEPS = 1_800_000
|
| 14 |
DROPOUT_RATE = 0.0 # Changed from the default since T5-1.1 recommends this.
|
| 15 |
-
INITIAL_CHECKPOINT_PATH = "gs://north-t5x/norwegian_NCC_plus_English_pluss200k_balanced_bokmaal_nynorsk_t5x_base/checkpoint_1700000"
|
| 16 |
#PjitPartitioner.num_partitions = 2
|
| 17 |
utils.SaveCheckpointConfig.period = 5000
|
| 18 |
utils.SaveCheckpointConfig.keep = 3
|
|
|
|
| 12 |
TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
|
| 13 |
TRAIN_STEPS = 1_800_000
|
| 14 |
DROPOUT_RATE = 0.0 # Changed from the default since T5-1.1 recommends this.
|
| 15 |
+
INITIAL_CHECKPOINT_PATH = "gs://north-t5x/pretrained_models/base/norwegian_NCC_plus_English_pluss200k_balanced_bokmaal_nynorsk_t5x_base/checkpoint_1700000"
|
| 16 |
#PjitPartitioner.num_partitions = 2
|
| 17 |
utils.SaveCheckpointConfig.period = 5000
|
| 18 |
utils.SaveCheckpointConfig.keep = 3
|
balanced_bokmaal_nynorsk_lm_large.gin
CHANGED
|
@@ -12,7 +12,7 @@ MIXTURE_OR_TASK_NAME = "balanced_bokmaal_nynorsk_prefix_lm_stream"
|
|
| 12 |
TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
|
| 13 |
TRAIN_STEPS = 1_800_000
|
| 14 |
DROPOUT_RATE = 0.0 # Changed from the default since T5-1.1 recommends this.
|
| 15 |
-
INITIAL_CHECKPOINT_PATH = "gs://north-t5x/norwegian_NCC_plus_English_pluss200k_balanced_bokmaal_nynorsk_t5x_large/checkpoint_1700000"
|
| 16 |
#PjitPartitioner.num_partitions = 2
|
| 17 |
utils.SaveCheckpointConfig.period = 5000
|
| 18 |
utils.SaveCheckpointConfig.keep = 3
|
|
|
|
| 12 |
TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
|
| 13 |
TRAIN_STEPS = 1_800_000
|
| 14 |
DROPOUT_RATE = 0.0 # Changed from the default since T5-1.1 recommends this.
|
| 15 |
+
INITIAL_CHECKPOINT_PATH = "gs://north-t5x/pretrained_models/large/norwegian_NCC_plus_English_pluss200k_balanced_bokmaal_nynorsk_t5x_large/checkpoint_1700000"
|
| 16 |
#PjitPartitioner.num_partitions = 2
|
| 17 |
utils.SaveCheckpointConfig.period = 5000
|
| 18 |
utils.SaveCheckpointConfig.keep = 3
|
balanced_bokmaal_nynorsk_lm_small.gin
CHANGED
|
@@ -12,7 +12,7 @@ MIXTURE_OR_TASK_NAME = "balanced_bokmaal_nynorsk_prefix_lm_stream"
|
|
| 12 |
TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
|
| 13 |
TRAIN_STEPS = 1_800_000
|
| 14 |
DROPOUT_RATE = 0.0 # Changed from the default since T5-1.1 recommends this.
|
| 15 |
-
INITIAL_CHECKPOINT_PATH = "gs://north-t5x/norwegian_NCC_plus_English_pluss200k_balanced_bokmaal_nynorsk_t5x_small/checkpoint_1700000"
|
| 16 |
#PjitPartitioner.num_partitions = 2
|
| 17 |
utils.SaveCheckpointConfig.period = 5000
|
| 18 |
utils.SaveCheckpointConfig.keep = 3
|
|
|
|
| 12 |
TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
|
| 13 |
TRAIN_STEPS = 1_800_000
|
| 14 |
DROPOUT_RATE = 0.0 # Changed from the default since T5-1.1 recommends this.
|
| 15 |
+
INITIAL_CHECKPOINT_PATH = "gs://north-t5x/pretrained_models/small/norwegian_NCC_plus_English_pluss200k_balanced_bokmaal_nynorsk_t5x_small/checkpoint_1700000"
|
| 16 |
#PjitPartitioner.num_partitions = 2
|
| 17 |
utils.SaveCheckpointConfig.period = 5000
|
| 18 |
utils.SaveCheckpointConfig.keep = 3
|
balanced_bokmaal_nynorsk_lm_xl.gin
CHANGED
|
@@ -12,7 +12,7 @@ MIXTURE_OR_TASK_NAME = "balanced_bokmaal_nynorsk_prefix_lm_stream"
|
|
| 12 |
TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
|
| 13 |
TRAIN_STEPS = 1_800_000
|
| 14 |
DROPOUT_RATE = 0.0 # Changed from the default since T5-1.1 recommends this.
|
| 15 |
-
INITIAL_CHECKPOINT_PATH = "gs://north-t5x/norwegian_NCC_plus_English_pluss200k_balanced_bokmaal_nynorsk_t5x_xl/checkpoint_1700000"
|
| 16 |
#PjitPartitioner.num_partitions = 2
|
| 17 |
utils.SaveCheckpointConfig.period = 5000
|
| 18 |
utils.SaveCheckpointConfig.keep = 3
|
|
|
|
| 12 |
TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
|
| 13 |
TRAIN_STEPS = 1_800_000
|
| 14 |
DROPOUT_RATE = 0.0 # Changed from the default since T5-1.1 recommends this.
|
| 15 |
+
INITIAL_CHECKPOINT_PATH = "gs://north-t5x/pretrained_models/xl/norwegian_NCC_plus_English_pluss200k_balanced_bokmaal_nynorsk_t5x_xl/checkpoint_1700000"
|
| 16 |
#PjitPartitioner.num_partitions = 2
|
| 17 |
utils.SaveCheckpointConfig.period = 5000
|
| 18 |
utils.SaveCheckpointConfig.keep = 3
|
balanced_bokmaal_nynorsk_lm_xxl.gin
CHANGED
|
@@ -12,7 +12,7 @@ MIXTURE_OR_TASK_NAME = "balanced_bokmaal_nynorsk_prefix_lm_stream"
|
|
| 12 |
TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
|
| 13 |
TRAIN_STEPS = 1_800_000
|
| 14 |
DROPOUT_RATE = 0.0 # Changed from the default since T5-1.1 recommends this.
|
| 15 |
-
INITIAL_CHECKPOINT_PATH = "gs://north-t5x/norwegian_NCC_plus_English_pluss200k_balanced_bokmaal_nynorsk_t5x_xxl/checkpoint_1700000"
|
| 16 |
#PjitPartitioner.num_partitions = 2
|
| 17 |
utils.SaveCheckpointConfig.period = 5000
|
| 18 |
utils.SaveCheckpointConfig.keep = 3
|
|
|
|
| 12 |
TASK_FEATURE_LENGTHS = {"inputs": 512, "targets": 512}
|
| 13 |
TRAIN_STEPS = 1_800_000
|
| 14 |
DROPOUT_RATE = 0.0 # Changed from the default since T5-1.1 recommends this.
|
| 15 |
+
INITIAL_CHECKPOINT_PATH = "gs://north-t5x/pretrained_models/xxl/norwegian_NCC_plus_English_pluss200k_balanced_bokmaal_nynorsk_t5x_xxl/checkpoint_1700000"
|
| 16 |
#PjitPartitioner.num_partitions = 2
|
| 17 |
utils.SaveCheckpointConfig.period = 5000
|
| 18 |
utils.SaveCheckpointConfig.keep = 3
|