Spaces:

dejanseo
/

gemini-tokens

Running

dejanseo committed 7 days ago

Commit

b9c9f51

verified ·

1 Parent(s): 3b51041

Update src/streamlit_app.py

Files changed (1) hide show

src/streamlit_app.py CHANGED Viewed

@@ -10,11 +10,16 @@ st.title("Gemini Token Probabilities")
 # --- Load the SentencePiece tokenizer once ---
 @st.cache_resource
 def load_tokenizer():
-    model_dir  = "gemini-1.5-pro-002"
     model_path = os.path.join(model_dir, "gemini-1.5-pro-002.spm.model")
     if not os.path.isfile(model_path):
         st.error(f"Cannot find model at:\n{model_path}")
         st.stop()
     sp = spm.SentencePieceProcessor()
     sp.Load(model_path)
     return sp
@@ -57,11 +62,6 @@ if st.button("Tokenize"):
         })
         # 5) Display with progress bars (as percentages)
-        #
-        #    - format="percent" tells Streamlit to multiply the 0–1 value by 100 internally
-        #      and append “%” to the label.
-        #    - min_value=0 and max_value=1 anchor the range.
-        #st.markdown("### Tokenization Result (Global 0–100 %)")
         st.dataframe(
             df,
             use_container_width=True,

 # --- Load the SentencePiece tokenizer once ---
 @st.cache_resource
 def load_tokenizer():
+    # Determine the directory that this script lives in (i.e. src/)
+    here = os.path.dirname(__file__)
+    # Build the absolute path to the gemini-1.5-pro-002 folder inside src/
+    model_dir = os.path.join(here, "gemini-1.5-pro-002")
     model_path = os.path.join(model_dir, "gemini-1.5-pro-002.spm.model")
     if not os.path.isfile(model_path):
         st.error(f"Cannot find model at:\n{model_path}")
         st.stop()
     sp = spm.SentencePieceProcessor()
     sp.Load(model_path)
     return sp
         })
         # 5) Display with progress bars (as percentages)
         st.dataframe(
             df,
             use_container_width=True,