diff --git a/config.json b/config.json index eb8ff65..d301ef0 100644 --- a/config.json +++ b/config.json @@ -22,7 +22,7 @@ "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 13696, - "max_position_embeddings": 64000, + "max_position_embeddings": 65536, "num_attention_heads": 32, "num_hidden_layers": 40, "num_key_value_heads": 2, diff --git a/tokenizer_config.json b/tokenizer_config.json index d4864cb..f4fdf71 100644 --- a/tokenizer_config.json +++ b/tokenizer_config.json @@ -211,7 +211,7 @@ "input_ids", "attention_mask" ], - "model_max_length": 64000, + "model_max_length": 65536, "padding_side": "left", "remove_space": false, "tokenizer_class": "PreTrainedTokenizer"