Spaces · Running on Zero

Ruurd committed · Commit ec35c53 · verified · 1 parent: a2125f4

Change to mask model

Files changed (1):
app.py · +34 -34
app.py CHANGED
@@ -25,51 +25,51 @@ with open("token_probabilities.json") as f:
     token_probs_dict = json.load(f)
     token_probabilities = np.array([token_probs_dict[str(i)] for i in range(len(token_probs_dict))], dtype=np.float32)
 
-# def load_model():
-#     ckpt_path = hf_hub_download(
-#         repo_id="ruurd/tini_bi_m",
-#         filename="diffusion-model.pth",
-#         token=os.getenv("HF_TOKEN")
-#     )
-
-#     device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-#     model = torch.load(ckpt_path, map_location=device)
-#     model = disable_dropout(model)
-#     model.to(device)
-#     model.eval()
-#     return model
-
 def load_model():
     ckpt_path = hf_hub_download(
-        repo_id="ruurd/tini_bi",
+        repo_id="ruurd/tini_bi_m",
         filename="diffusion-model.pth",
-        token=os.getenv("HF_TOKEN"),
-        revision="5a22a8b6168466dbbf704efd00d8cbf2eee51426",
+        token=os.getenv("HF_TOKEN")
     )
 
     device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+    model = torch.load(ckpt_path, map_location=device)
+    model = disable_dropout(model)
+    model.to(device)
+    model.eval()
+    return model
 
-    # Step 1: Create model from scratch
-    model = CustomTransformerModel(CustomTransformerConfig())
+# def load_model():
+#     ckpt_path = hf_hub_download(
+#         repo_id="ruurd/tini_bi",
+#         filename="diffusion-model.pth",
+#         token=os.getenv("HF_TOKEN"),
+#         revision="5a22a8b6168466dbbf704efd00d8cbf2eee51426",
+#     )
 
-    # Step 2: Load state_dict from full checkpoint
-    full_model = torch.load(ckpt_path, map_location=device)
+#     device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 
-    # This handles both full model or just state_dict
-    try:
-        state_dict = full_model.state_dict()
-    except AttributeError:
-        state_dict = full_model  # already a state_dict
+#     # Step 1: Create model from scratch
+#     model = CustomTransformerModel(CustomTransformerConfig())
 
-    # Step 3: Load weights (might print mismatches)
-    missing, unexpected = model.load_state_dict(state_dict, strict=False)
-    print("Missing keys:", missing)
-    print("Unexpected keys:", unexpected)
+#     # Step 2: Load state_dict from full checkpoint
+#     full_model = torch.load(ckpt_path, map_location=device)
 
-    model = disable_dropout(model)
-    model.to(device)
-    model.eval()
-    return model
+#     # This handles both full model or just state_dict
+#     try:
+#         state_dict = full_model.state_dict()
+#     except AttributeError:
+#         state_dict = full_model  # already a state_dict
+
+#     # Step 3: Load weights (might print mismatches)
+#     missing, unexpected = model.load_state_dict(state_dict, strict=False)
+#     print("Missing keys:", missing)
+#     print("Unexpected keys:", unexpected)
+
+#     model = disable_dropout(model)
+#     model.to(device)
+#     model.eval()
+#     return model
 
 
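For readers comparing the two loaders: the newly active load_model() treats the downloaded .pth file as a fully pickled nn.Module, so torch.load() returns a usable model object directly, while the now commented-out variant rebuilds CustomTransformerModel and copies weights in via load_state_dict(). The sketch below illustrates that distinction only; TinyModel is a hypothetical stand-in for the Space's real architecture, the file names are placeholders, and weights_only assumes a reasonably recent PyTorch.

import torch
import torch.nn as nn

class TinyModel(nn.Module):
    # Hypothetical stand-in for CustomTransformerModel; not the Space's real architecture.
    def __init__(self):
        super().__init__()
        self.linear = nn.Linear(4, 4)

# Variant A -- what the newly active load_model() assumes: the checkpoint is a fully
# pickled nn.Module, so torch.load() hands back a ready-to-use model object.
# weights_only=False (available from roughly PyTorch 1.13 on) is needed on PyTorch 2.6+,
# where the default changed to True and blocks unpickling arbitrary classes.
torch.save(TinyModel(), "full-model.pth")
model_a = torch.load("full-model.pth", map_location="cpu", weights_only=False)
model_a.eval()

# Variant B -- what the commented-out loader did: rebuild the architecture first, then
# copy weights from a state_dict; strict=False reports key mismatches instead of raising.
torch.save(TinyModel().state_dict(), "state-dict.pth")
model_b = TinyModel()
loaded = torch.load("state-dict.pth", map_location="cpu")
state_dict = loaded.state_dict() if hasattr(loaded, "state_dict") else loaded
missing, unexpected = model_b.load_state_dict(state_dict, strict=False)
print("Missing keys:", missing, "Unexpected keys:", unexpected)
model_b.eval()

Variant A is simpler but ties the checkpoint to the exact class definitions importable at load time; Variant B only needs parameter names and shapes to match, which is why it tolerates partial mismatches via strict=False.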