Simon Salmon
committed on
Commit
·
44fc0ac
1
Parent(s):
69063a5
Update app.py
Browse files
app.py
CHANGED
@@ -19,11 +19,14 @@ artist_name = st.text_input("Model", "BigSalmon/FormalBerta")
|
|
19 |
tokenizer = AutoTokenizer.from_pretrained("BigSalmon/FormalBerta")
|
20 |
model = AutoModelForMaskedLM.from_pretrained(artist_name)
|
21 |
|
|
|
|
|
22 |
with st.form(key='my_form'):
|
23 |
prompt = st.text_area(label='Enter sentence')
|
24 |
submit_button = st.form_submit_button(label='Submit')
|
25 |
|
26 |
if submit_button:
|
|
|
27 |
token_ids = tokenizer.encode(prompt, return_tensors='pt')
|
28 |
token_ids_tk = tokenizer.tokenize(prompt, return_tensors='pt')
|
29 |
masked_position = (token_ids.squeeze() == tokenizer.mask_token_id).nonzero()
|
@@ -35,7 +38,16 @@ with st.form(key='my_form'):
|
|
35 |
mask_hidden_state = last_hidden_state[mask_index]
|
36 |
idx = torch.topk(mask_hidden_state, k=100, dim=0)[1]
|
37 |
words = [tokenizer.decode(i.item()).strip() for i in idx]
|
38 |
-
|
39 |
-
|
40 |
-
|
41 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
19 |
tokenizer = AutoTokenizer.from_pretrained("BigSalmon/FormalBerta")
|
20 |
model = AutoModelForMaskedLM.from_pretrained(artist_name)
|
21 |
|
22 |
+
|
23 |
+
|
24 |
with st.form(key='my_form'):
|
25 |
prompt = st.text_area(label='Enter sentence')
|
26 |
submit_button = st.form_submit_button(label='Submit')
|
27 |
|
28 |
if submit_button:
|
29 |
+
a_list = []
|
30 |
token_ids = tokenizer.encode(prompt, return_tensors='pt')
|
31 |
token_ids_tk = tokenizer.tokenize(prompt, return_tensors='pt')
|
32 |
masked_position = (token_ids.squeeze() == tokenizer.mask_token_id).nonzero()
|
|
|
38 |
mask_hidden_state = last_hidden_state[mask_index]
|
39 |
idx = torch.topk(mask_hidden_state, k=100, dim=0)[1]
|
40 |
words = [tokenizer.decode(i.item()).strip() for i in idx]
|
41 |
+
a_list.append(words)
|
42 |
+
length = len(a_list)
|
43 |
+
middle_index = length//2
|
44 |
+
first_half = a_list[:middle_index]
|
45 |
+
second_half = a_list[middle_index:]
|
46 |
+
#st.write(words)
|
47 |
+
#col1= st.columns(1)
|
48 |
+
#with col1:
|
49 |
+
#st.write(words)
|
50 |
+
st.write(pd.DataFrame({
|
51 |
+
... 'first column': first_half,
|
52 |
+
... 'second column': second_half,
|
53 |
+
... }))
|