From 613059737aaa2aafb3e9e1e86a9e232bb17e03a0 Mon Sep 17 00:00:00 2001
From: Nathan TeBlunthuis
Date: Sun, 1 Dec 2024 15:25:18 -0800
Subject: [PATCH] set os environment for big machine

---
Review notes (this area is ignored when the patch is applied):
  * The added line originally read
        os.environ(["_JAVA_OPTIONS"]="-Xmx920g"
    which is a SyntaxError: the parenthesis is never closed, and os.environ
    is a mapping, not a callable. It now uses item assignment.
  * "-Xmx" is the JVM maximum-heap-size option, so this requests a 920 GB
    heap ceiling for a JVM that reads _JAVA_OPTIONS.
  * Assumes `os` is already imported above line 14 of term_frequencies.py
    and that this assignment runs before any JVM is started - TODO confirm.
  * The blob id on the "index" line predates this correction.

 ngrams/term_frequencies.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/ngrams/term_frequencies.py b/ngrams/term_frequencies.py
index 741e914..1bb0f70 100755
--- a/ngrams/term_frequencies.py
+++ b/ngrams/term_frequencies.py
@@ -14,6 +14,7 @@ from nltk.util import ngrams
 import string
 from random import random
 from pathlib import Path
+os.environ["_JAVA_OPTIONS"] = "-Xmx920g"
 
 # remove urls
 # taken from https://stackoverflow.com/questions/3809401/what-is-a-good-regular-expression-to-match-a-url