diff --git a/train.py b/train.py
index 10d4c2cd..5748aed9 100644
--- a/train.py
+++ b/train.py
@@ -4,8 +4,8 @@
 """
 
 # feel free to use either
-from bpe_regex import Tokenizer as RegexTokenizer
-from bpe_basic import Tokenizer as BasicTokenizer
+from bpe_regex import RegexTokenizer
+from bpe_basic import BasicTokenizer
 
 # open some text and train a vocab of 512 tokens
 text = open("taylorswift.txt", "r", encoding="utf-8").read()