Downloading only the `punkt` resource was causing an error, since we depend on `punkt_tab`.
@@ -9,7 +9,7 @@ import nltk
warnings.filterwarnings(
"ignore", category=FutureWarning, module="transformers.tokenization_utils_base"
)
-nltk.download("punkt", quiet=True)
+nltk.download("punkt_tab", quiet=True)
def getArticleText(url):