morethanair committed on
Commit
3d9f590
·
2 Parent(s): 35d2b81 6ca41f1

Merge pull request #3 from morethanair/fix/korean-embedding-model

Browse files
Files changed (2) hide show
  1. app.py +3 -3
  2. requirements.txt +1 -0
app.py CHANGED
@@ -84,7 +84,7 @@ def generate_youtube_embed_html(youtube_url: str, timestamp: str) -> str | None:
84
  PINECONE_API_KEY = os.getenv("PINECONE_API_KEY","pcsk_PZHLK_TRAvMCyNmJM4FKGCX7rbbY22a58fhnWYasx1mf3WL6sRasoASZXfsbnJYvCQ13w") # Load from environment variable
85
  PINECONE_ENV = os.getenv("PINECONE_ENV", "us-east-1")
86
  INDEX_NAME = "video-embeddings"
87
- EMBEDDING_MODEL = SentenceTransformer('sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2')
88
 
89
  # OpenAI 설정
90
  OPENAI_API_KEY = "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"
@@ -109,8 +109,8 @@ def init_pinecone():
109
  def load_embedding_model():
110
  """Sentence Transformer 모델을 로드합니다."""
111
  try:
112
- model = SentenceTransformer(EMBEDDING_MODEL)
113
- logger.info(f"Successfully loaded embedding model: {EMBEDDING_MODEL}")
114
  return model
115
  except Exception as e:
116
  st.error(f"임베딩 모델 로딩 중 오류 발생: {e}")
 
84
  PINECONE_API_KEY = os.getenv("PINECONE_API_KEY","pcsk_PZHLK_TRAvMCyNmJM4FKGCX7rbbY22a58fhnWYasx1mf3WL6sRasoASZXfsbnJYvCQ13w") # Load from environment variable
85
  PINECONE_ENV = os.getenv("PINECONE_ENV", "us-east-1")
86
  INDEX_NAME = "video-embeddings"
87
+ EMBEDDING_MODEL_ID = 'jhgan/ko-sroberta-multitask' # ๋ชจ๋ธ ID๋กœ ๋ณ€๊ฒฝ
88
 
89
  # OpenAI 설정
90
  OPENAI_API_KEY = "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"
 
109
  def load_embedding_model():
110
  """Sentence Transformer 모델을 로드합니다."""
111
  try:
112
+ model = SentenceTransformer(EMBEDDING_MODEL_ID) # 수정된 모델 ID 사용
113
+ logger.info(f"Successfully loaded embedding model: {EMBEDDING_MODEL_ID}") # 수정된 모델 ID 사용
114
  return model
115
  except Exception as e:
116
  st.error(f"임베딩 모델 로딩 중 오류 발생: {e}")
requirements.txt CHANGED
@@ -5,3 +5,4 @@ pandas
5
  openai
6
  sentence-transformers==2.2.2
7
  torch==2.2.0
 
 
5
  openai
6
  sentence-transformers==2.2.2
7
  torch==2.2.0
8
+ huggingface-hub==0.0.8