MrGanesh committed on
Commit
faf760a
·
1 Parent(s): 9d7cea2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -9
app.py CHANGED
@@ -5,13 +5,11 @@ import yake
5
  from keyphrase_vectorizers import KeyphraseCountVectorizer
6
 
7
  @st.cache(allow_output_mutation=True, suppress_st_warning=True, show_spinner=True)
8
- def load_model():
9
- model = KeyBERT("google/bigbird-pegasus-large-bigpatent")
10
- return model
11
 
12
- model = load_model()
13
-
14
-
15
  st.title("Patent Text Extractor")
16
  placeholder = st.empty()
17
  text_input = placeholder.text_area("Paste or write text", height=300)
@@ -39,11 +37,11 @@ button = st.button("Extract Keywords")
39
  kw_extractor = yake.KeywordExtractor(top=50)
40
  candidates = kw_extractor.extract_keywords(text_input)
41
  keyphrases = [candidate[0] for candidate in candidates]
42
- #kw_model = KeyBERT(model=model)
43
 
44
  #if keywords != []:
45
- keywords = model.extract_keywords(text_input,keyphrases, keyphrase_ngram_range=(1, 3),
46
- top_n=50,stop_words='english')
47
  if keywords != []:
48
  st.info("Extracted keywords")
49
  keywords = pd.DataFrame(keywords, columns=["Keyword", "Score"])
 
5
  from keyphrase_vectorizers import KeyphraseCountVectorizer
6
 
7
  @st.cache(allow_output_mutation=True, suppress_st_warning=True, show_spinner=True)
8
+ #def load_model():
9
+ #model = KeyBERT("google/bigbird-pegasus-large-bigpatent")
10
+ #return model
11
 
12
+ #model = load_model()
 
 
13
  st.title("Patent Text Extractor")
14
  placeholder = st.empty()
15
  text_input = placeholder.text_area("Paste or write text", height=300)
 
37
  kw_extractor = yake.KeywordExtractor(top=50)
38
  candidates = kw_extractor.extract_keywords(text_input)
39
  keyphrases = [candidate[0] for candidate in candidates]
40
+ kw_model = KeyBERT(model="google/bigbird-pegasus-large-bigpatent")
41
 
42
  #if keywords != []:
43
+ keywords = kw_model.extract_keywords(text_input,keyphrases, keyphrase_ngram_range=(1, 3),
44
+ top_n=50,stop_words='english',vectorizer=KeyphraseCountVectorizer())
45
  if keywords != []:
46
  st.info("Extracted keywords")
47
  keywords = pd.DataFrame(keywords, columns=["Keyword", "Score"])