3 changed files with 0 additions and 24 deletions
--- a/README.md
+++ b/README.md
@@ -1,5 +0,0 @@
-# Transformer-based Translator
-
-Simple Transformer
-
-! [](image/Screenshot_20230329_023305.png)
--- a/image/Screenshot_20230329_023305.png
+++ b/image/Screenshot_20230329_023305.png
--- a/predict.py
+++ b/predict.py
@@ -22,25 +22,6 @@ SHOW_NUM = 5
 NUM_HEADS = 8
 DROPOUT_RATE = 0.5

-def en2tokens(en_sentence, en_vocab, for_model=False, en_seq=50):
-    '''
-        English to tokens
-
-        Args:
-            en_sentence (str)
-            en_vocab (torchtext.Vocab)
-            
-            for_model (bool, default=False): if `True`, it will add <SOS>, <END>, <PAD> tokens
-            en_seq (int): for padding <PAD>
-        Outputs:
-            tokens (LongTensor): (b,)
-    '''
-    tokenizer = torchtext.data.utils.get_tokenizer("basic_english")
-    tokens = en_vocab( tokenizer(en_sentence.lower()) )
-    if for_model:
-        tokens = [ en_vocab['<SOS>'] ] + tokens + [ en_vocab['<END>'] ]
-        tokens = tokens + [ en_vocab['<PAD>'] for _ in range(en_seq - len(tokens)) ]
-    return torch.LongTensor(tokens)

 def predict(en_str, model, en_vocab, ch_vocab):