morethanair committed on
Commit
8e463d1
·
2 Parent(s): b59f879 3d9f590

Merge branch 'main' into az5u5j-codex/fix-error-with-korean-embedding-model

Browse files
Files changed (2) hide show
  1. app.py +3 -4
  2. requirements.txt +1 -0
app.py CHANGED
@@ -93,8 +93,7 @@ def generate_youtube_embed_html(youtube_url: str, timestamp: str) -> str | None:
93
  PINECONE_API_KEY = os.getenv("PINECONE_API_KEY","pcsk_PZHLK_TRAvMCyNmJM4FKGCX7rbbY22a58fhnWYasx1mf3WL6sRasoASZXfsbnJYvCQ13w") # Load from environment variable
94
  PINECONE_ENV = os.getenv("PINECONE_ENV", "us-east-1")
95
  INDEX_NAME = "video-embeddings"
96
- # Use a lightweight multilingual model that works well with Korean
97
- EMBEDDING_MODEL_NAME = "intfloat/multilingual-e5-small"
98
 
99
  # OpenAI 설정
100
  OPENAI_API_KEY = "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"
@@ -119,8 +118,8 @@ def init_pinecone():
119
  def load_embedding_model():
120
  """Sentence Transformer 모델을 로드합니다."""
121
  try:
122
- model = SentenceTransformer(EMBEDDING_MODEL_NAME)
123
- logger.info(f"Successfully loaded embedding model: {EMBEDDING_MODEL_NAME}")
124
  return model
125
  except Exception as e:
126
  st.error(f"임베딩 모델 로딩 중 오류 발생: {e}")
 
93
  PINECONE_API_KEY = os.getenv("PINECONE_API_KEY","pcsk_PZHLK_TRAvMCyNmJM4FKGCX7rbbY22a58fhnWYasx1mf3WL6sRasoASZXfsbnJYvCQ13w") # Load from environment variable
94
  PINECONE_ENV = os.getenv("PINECONE_ENV", "us-east-1")
95
  INDEX_NAME = "video-embeddings"
96
+ EMBEDDING_MODEL_ID = 'jhgan/ko-sroberta-multitask' # ๋ชจ๋ธ ID๋กœ ๋ณ€๊ฒฝ
 
97
 
98
  # OpenAI 설정
99
  OPENAI_API_KEY = "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"
 
118
  def load_embedding_model():
119
  """Sentence Transformer 모델을 로드합니다."""
120
  try:
121
+ model = SentenceTransformer(EMBEDDING_MODEL_ID) # 수정된 모델 ID 사용
122
+ logger.info(f"Successfully loaded embedding model: {EMBEDDING_MODEL_ID}") # 수정된 모델 ID 사용
123
  return model
124
  except Exception as e:
125
  st.error(f"임베딩 모델 로딩 중 오류 발생: {e}")
requirements.txt CHANGED
@@ -6,3 +6,4 @@ openai
6
  huggingface-hub
7
  sentence-transformers==2.2.2
8
  torch==2.2.0
 
 
6
  huggingface-hub
7
  sentence-transformers==2.2.2
8
  torch==2.2.0
9
+ huggingface-hub==0.0.8