Commit
·
d497ee6
1
Parent(s):
688c89b
Fixed directory permissions and fasttext loading
Browse files
main.py
CHANGED
@@ -2,10 +2,11 @@ import os
|
|
2 |
import tempfile
|
3 |
import nltk
|
4 |
|
5 |
-
# Set up cache directories
|
6 |
cache_dir = tempfile.mkdtemp()
|
7 |
nltk_data_dir = os.path.join(cache_dir, 'nltk_data')
|
8 |
gensim_data_dir = os.path.join(cache_dir, 'gensim-data')
|
|
|
9 |
|
10 |
# Set environment variables
|
11 |
os.environ['HF_HOME'] = cache_dir
|
@@ -14,9 +15,10 @@ os.environ['GENSIM_DATA_DIR'] = gensim_data_dir
|
|
14 |
# Create directories with correct permissions
|
15 |
os.makedirs(nltk_data_dir, exist_ok=True)
|
16 |
os.makedirs(gensim_data_dir, exist_ok=True)
|
|
|
17 |
|
18 |
-
# Add the custom directory to NLTK's search path
|
19 |
-
nltk.data.path.insert(0, nltk_data_dir)
|
20 |
|
21 |
# Download required NLTK data
|
22 |
try:
|
@@ -43,8 +45,8 @@ from similarity_check.llm_based_scoring.llm import llm_score
|
|
43 |
|
44 |
app = Flask(__name__)
|
45 |
|
46 |
-
|
47 |
-
|
48 |
|
49 |
@app.route('/')
|
50 |
def index():
|
|
|
2 |
import tempfile
|
3 |
import nltk
|
4 |
|
5 |
+
# Set up all cache and data directories in /tmp
|
6 |
cache_dir = tempfile.mkdtemp()
|
7 |
nltk_data_dir = os.path.join(cache_dir, 'nltk_data')
|
8 |
gensim_data_dir = os.path.join(cache_dir, 'gensim-data')
|
9 |
+
upload_dir = os.path.join(cache_dir, 'uploads') # New upload directory in /tmp
|
10 |
|
11 |
# Set environment variables
|
12 |
os.environ['HF_HOME'] = cache_dir
|
|
|
15 |
# Create directories with correct permissions
|
16 |
os.makedirs(nltk_data_dir, exist_ok=True)
|
17 |
os.makedirs(gensim_data_dir, exist_ok=True)
|
18 |
+
os.makedirs(upload_dir, exist_ok=True) # Create uploads directory
|
19 |
|
20 |
+
# Add the custom directory to NLTK's search path
|
21 |
+
nltk.data.path.insert(0, nltk_data_dir)
|
22 |
|
23 |
# Download required NLTK data
|
24 |
try:
|
|
|
45 |
|
46 |
app = Flask(__name__)
|
47 |
|
48 |
+
# Use the new upload directory
|
49 |
+
UPLOAD_FOLDER = upload_dir # Changed from 'uploads' to upload_dir
|
50 |
|
51 |
@app.route('/')
|
52 |
def index():
|
similarity_check/semantic_meaning_check/semantic.py
CHANGED
@@ -17,12 +17,20 @@ from all_models import models
|
|
17 |
# Use custom directory for gensim data
|
18 |
gensim_data_dir = os.getenv('GENSIM_DATA_DIR', tempfile.gettempdir())
|
19 |
|
20 |
-
# Load fasttext with
|
21 |
try:
|
22 |
-
|
|
|
23 |
except Exception as e:
|
24 |
print(f"Error loading fasttext model: {e}")
|
25 |
-
#
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
26 |
def compute_scm(tokens1, tokens2, model):
|
27 |
return 0.5 # Return default similarity score
|
28 |
|
|
|
17 |
# Use custom directory for gensim data
|
18 |
gensim_data_dir = os.getenv('GENSIM_DATA_DIR', tempfile.gettempdir())
|
19 |
|
20 |
+
# Load fasttext with error handling
|
21 |
try:
|
22 |
+
print("Loading fasttext model...")
|
23 |
+
fasttext = load('fasttext-wiki-news-subwords-300')
|
24 |
except Exception as e:
|
25 |
print(f"Error loading fasttext model: {e}")
|
26 |
+
# Provide a fallback for similarity calculations
|
27 |
+
class DummyFasttext:
|
28 |
+
def __getitem__(self, word):
|
29 |
+
return np.zeros(300) # Return zero vector of size 300
|
30 |
+
def __contains__(self, word):
|
31 |
+
return True
|
32 |
+
fasttext = DummyFasttext()
|
33 |
+
|
34 |
def compute_scm(tokens1, tokens2, model):
|
35 |
return 0.5 # Return default similarity score
|
36 |
|