saicharan2804 committed on
Commit
409a8a3
·
1 Parent(s): 0cee7ca

Added token IDs

Browse files
Files changed (2) hide show
  1. BpeTokenizer.py +4 -1
  2. app.py +1 -7
BpeTokenizer.py CHANGED
@@ -9,5 +9,8 @@ def bpe_tokenizer(smiles_string):
9
 
10
  # To get the tokenized output as text
11
  tokens_text = encoded_output.tokens
 
 
 
12
 
13
- return tokens_text
 
9
 
10
  # To get the tokenized output as text
11
  tokens_text = encoded_output.tokens
12
+
13
+ # To get the corresponding token IDs
14
+ token_ids = encoded_output.ids
15
 
16
+ return tokens_text, token_ids
app.py CHANGED
@@ -1,18 +1,12 @@
1
  import gradio as gr
2
  from BpeTokenizer import bpe_tokenizer
3
 
4
- # def tem(name, num = 3):
5
- # return name + num
6
-
7
-
8
- # iface = gr.Interface(fn=tem, inputs=["text", "text"], outputs="text")
9
-
10
  iface = gr.Interface(
11
  fn = bpe_tokenizer,
12
  inputs=[
13
  gr.Textbox(label="SMILES"),
14
  ],
15
- outputs="text"
16
  )
17
 
18
  iface.launch()
 
1
  import gradio as gr
2
  from BpeTokenizer import bpe_tokenizer
3
 
 
 
 
 
 
 
4
  iface = gr.Interface(
5
  fn = bpe_tokenizer,
6
  inputs=[
7
  gr.Textbox(label="SMILES"),
8
  ],
9
+ outputs=["text", "text"]
10
  )
11
 
12
  iface.launch()