diff --git a/README.md b/README.md index 8b7f259..4eacabb 100644 --- a/README.md +++ b/README.md @@ -162,7 +162,7 @@ lbl2idx = {"B": 0, "I": 1, "O": 2} idx2label = {0: "B", 1: "I", 2: "O"} # Tokenizer -tokenizer = AutoTokenizer.from_pretrained("distilbert-base-uncased", add_prefix_space=True) +tokenizer = AutoTokenizer.from_pretrained("distilbert-base-uncased") max_length = 512 # Dataset parameters