yamanavijayavardhan committed on
Commit
d497ee6
·
1 Parent(s): 688c89b

Fixed directory permissions and fasttext loading

Browse files
main.py CHANGED
@@ -2,10 +2,11 @@ import os
2
  import tempfile
3
  import nltk
4
 
5
- # Set up cache directories
6
  cache_dir = tempfile.mkdtemp()
7
  nltk_data_dir = os.path.join(cache_dir, 'nltk_data')
8
  gensim_data_dir = os.path.join(cache_dir, 'gensim-data')
 
9
 
10
  # Set environment variables
11
  os.environ['HF_HOME'] = cache_dir
@@ -14,9 +15,10 @@ os.environ['GENSIM_DATA_DIR'] = gensim_data_dir
14
  # Create directories with correct permissions
15
  os.makedirs(nltk_data_dir, exist_ok=True)
16
  os.makedirs(gensim_data_dir, exist_ok=True)
 
17
 
18
- # Add the custom directory to NLTK's search path BEFORE downloading
19
- nltk.data.path.insert(0, nltk_data_dir) # Insert at beginning of search path
20
 
21
  # Download required NLTK data
22
  try:
@@ -43,8 +45,8 @@ from similarity_check.llm_based_scoring.llm import llm_score
43
 
44
  app = Flask(__name__)
45
 
46
- UPLOAD_FOLDER = 'uploads'
47
- os.makedirs(UPLOAD_FOLDER, exist_ok=True)
48
 
49
  @app.route('/')
50
  def index():
 
2
  import tempfile
3
  import nltk
4
 
5
+ # Set up all cache and data directories in /tmp
6
  cache_dir = tempfile.mkdtemp()
7
  nltk_data_dir = os.path.join(cache_dir, 'nltk_data')
8
  gensim_data_dir = os.path.join(cache_dir, 'gensim-data')
9
+ upload_dir = os.path.join(cache_dir, 'uploads') # New upload directory in /tmp
10
 
11
  # Set environment variables
12
  os.environ['HF_HOME'] = cache_dir
 
15
  # Create directories with correct permissions
16
  os.makedirs(nltk_data_dir, exist_ok=True)
17
  os.makedirs(gensim_data_dir, exist_ok=True)
18
+ os.makedirs(upload_dir, exist_ok=True) # Create uploads directory
19
 
20
+ # Add the custom directory to NLTK's search path
21
+ nltk.data.path.insert(0, nltk_data_dir)
22
 
23
  # Download required NLTK data
24
  try:
 
45
 
46
  app = Flask(__name__)
47
 
48
+ # Use the new upload directory
49
+ UPLOAD_FOLDER = upload_dir # Changed from 'uploads' to upload_dir
50
 
51
  @app.route('/')
52
  def index():
similarity_check/semantic_meaning_check/semantic.py CHANGED
@@ -17,12 +17,20 @@ from all_models import models
17
  # Use custom directory for gensim data
18
  gensim_data_dir = os.getenv('GENSIM_DATA_DIR', tempfile.gettempdir())
19
 
20
- # Load fasttext with custom data directory
21
  try:
22
- fasttext = load('fasttext-wiki-news-subwords-300', data_dir=gensim_data_dir)
 
23
  except Exception as e:
24
  print(f"Error loading fasttext model: {e}")
25
- # Fallback similarity function if model fails to load
 
 
 
 
 
 
 
26
  def compute_scm(tokens1, tokens2, model):
27
  return 0.5 # Return default similarity score
28
 
 
17
  # Use custom directory for gensim data
18
  gensim_data_dir = os.getenv('GENSIM_DATA_DIR', tempfile.gettempdir())
19
 
20
+ # Load fasttext with error handling
21
  try:
22
+ print("Loading fasttext model...")
23
+ fasttext = load('fasttext-wiki-news-subwords-300')
24
  except Exception as e:
25
  print(f"Error loading fasttext model: {e}")
26
+ # Provide a fallback for similarity calculations
27
+ class DummyFasttext:
28
+ def __getitem__(self, word):
29
+ return np.zeros(300) # Return zero vector of size 300
30
+ def __contains__(self, word):
31
+ return True
32
+ fasttext = DummyFasttext()
33
+
34
  def compute_scm(tokens1, tokens2, model):
35
  return 0.5 # Return default similarity score
36