Spaces:

trysem
/

it2

Runtime error

App Files Files Community

trysem committed on Mar 30

Commit

c529ee8

verified ·

1 Parent(s): 92fd8d8

Create app.py

Browse files

Files changed (1) hide show

app.py +67 -0

app.py ADDED Viewed

	@@ -0,0 +1,67 @@

+import importlib.util
+
+import torch
+from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
+from IndicTransToolkit import IndicProcessor
+
+# Demo script: translate a few English sentences into Hindi with IndicTrans2
+# and print each source sentence next to its translation.
+#
+# Running on a GPU with flash_attn installed is recommended, but neither is
+# assumed: attn_implementation is only set when flash_attn is importable, and
+# half precision is only requested when a CUDA device is present.
+DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
+src_lang, tgt_lang = "eng_Latn", "hin_Deva"
+model_name = "ai4bharat/indictrans2-en-indic-1B"
+
+tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
+
+# Build the model-loading options from what the host actually provides, so the
+# script still starts on a CPU-only machine or one without flash_attn.
+model_kwargs = {"trust_remote_code": True}
+if DEVICE == "cuda":
+    # performance might slightly vary for bfloat16
+    model_kwargs["torch_dtype"] = torch.float16
+    # Don't set attn_implementation if flash_attn is not installed.
+    if importlib.util.find_spec("flash_attn") is not None:
+        model_kwargs["attn_implementation"] = "flash_attention_2"
+else:
+    # NOTE(review): float32 is chosen on CPU on the assumption that fp16
+    # kernels are slow or unsupported there - confirm for the target torch.
+    model_kwargs["torch_dtype"] = torch.float32
+
+model = AutoModelForSeq2SeqLM.from_pretrained(model_name, **model_kwargs).to(DEVICE)
+
+ip = IndicProcessor(inference=True)
+
+input_sentences = [
+    "When I was young, I used to go to the park every day.",
+    "We watched a new movie last week, which was very inspiring.",
+    "If you had met me at that time, we would have gone out to eat.",
+    "My friend has invited me to his birthday party, and I will give him a gift.",
+]
+
+# Preprocess the raw sentences for the given source/target language pair
+batch = ip.preprocess_batch(
+    input_sentences,
+    src_lang=src_lang,
+    tgt_lang=tgt_lang,
+)
+
+# Tokenize the sentences and generate input encodings
+inputs = tokenizer(
+    batch,
+    truncation=True,
+    padding="longest",
+    return_tensors="pt",
+    return_attention_mask=True,
+).to(DEVICE)
+
+# Generate translations using the model (no gradients needed for inference)
+with torch.no_grad():
+    generated_tokens = model.generate(
+        **inputs,
+        use_cache=True,
+        min_length=0,
+        max_length=256,
+        num_beams=5,
+        num_return_sequences=1,
+    )
+
+# Decode the generated tokens into text. The decoded strings get their own
+# name so `generated_tokens` keeps referring to the token-id tensor.
+with tokenizer.as_target_tokenizer():
+    decoded_sentences = tokenizer.batch_decode(
+        generated_tokens.detach().cpu().tolist(),
+        skip_special_tokens=True,
+        clean_up_tokenization_spaces=True,
+    )
+
+# Postprocess the translations, including entity replacement
+translations = ip.postprocess_batch(decoded_sentences, lang=tgt_lang)
+
+for input_sentence, translation in zip(input_sentences, translations):
+    print(f"{src_lang}: {input_sentence}")
+    print(f"{tgt_lang}: {translation}")