deeppunct-gr

Runtime error

wldmr committed on Apr 2, 2023

Commit

072aee3

1 Parent(s): c5c1da9

load nltk

Files changed (2) hide show

app.py CHANGED Viewed

@@ -83,6 +83,8 @@ def predict(brakes, transcript):
 if __name__ == "__main__":
     title = "Deep Punkt App"
     description = """
 <b>Description</b>: <br>

 if __name__ == "__main__":
+    metrics.load_nltk()
     title = "Deep Punkt App"
     description = """
 <b>Description</b>: <br>

metrics.py CHANGED Viewed

@@ -1,8 +1,17 @@
 # Import nltk library for natural language processing
 import nltk
 from transformers import AutoTokenizer
 # Define a function that takes some text as input and returns the number of tokens
 def token_count(text):
     # Import the Encoder class from bpe

 # Import nltk library for natural language processing
 import nltk
+import os
 from transformers import AutoTokenizer
+def load_nltk():
+    """Make sure the NLTK 'punkt' tokenizer data is available locally.
+
+    Looks the resource up through NLTK's own search mechanism and only
+    downloads it when the lookup fails. Progress is reported with print().
+
+    Returns:
+        None
+    """
+    try:
+        # nltk.data.find searches every directory in nltk.data.path (including
+        # NLTK_DATA) and accepts both the zipped and the unpacked resource, so
+        # no single absolute path such as /home/user/nltk_data is assumed.
+        punkt_location = nltk.data.find('tokenizers/punkt')
+    except LookupError:
+        print("downloading punkt file")
+        # nltk.download reports failure through its boolean return value
+        # instead of raising, so check it rather than failing silently.
+        if not nltk.download('punkt'):
+            print("failed to download punkt file")
+    else:
+        print('nltk punkt file exists in ', punkt_location)
 # Define a function that takes some text as input and returns the number of tokens
 def token_count(text):
     # Import the Encoder class from bpe