pubchem_encoder.py (#10)

Browse files

- Update smi-ted/training/pubchem_encoder.py (860a7f64e058ebd5eb3480db5bba91f0b633506e)

Co-authored-by: Victor Yukio Shirasuna <vshirasuna@users.noreply.huggingface.co>

Files changed (1)

smi-ted/training/pubchem_encoder.py +1 -1

smi-ted/training/pubchem_encoder.py CHANGED Viewed

@@ -72,7 +72,7 @@ class Encoder():
         if self.add_eos == True:
             char = char + ['<eos>']
-        return torch.tensor([self.char2id[word] for word in char])
+        return torch.tensor([self.char2id.get(word, self.char2id["<unk>"]) for word in char])
     def encoder(self, tokens):
         #return *map(lambda x: self.encode(x), tokens)