Change gen output
Browse files
app.py
CHANGED
|
@@ -16,6 +16,7 @@ tokenizer = AutoTokenizer.from_pretrained(peft_model_id)
|
|
| 16 |
# Load the Lora model
|
| 17 |
model = PeftModel.from_pretrained(model, peft_model_id)
|
| 18 |
|
|
|
|
| 19 |
|
| 20 |
def gen_entities(text):
|
| 21 |
text = f"<SP> text: {text}\n\n entities: "
|
|
@@ -23,7 +24,8 @@ def gen_entities(text):
|
|
| 23 |
with torch.cuda.amp.autocast():
|
| 24 |
output_tokens = model.generate(**batch, max_new_tokens=256, eos_token_id=50258)
|
| 25 |
|
| 26 |
-
return tokenizer.decode(output_tokens, skip_special_tokens=False)
|
|
|
|
| 27 |
|
| 28 |
|
| 29 |
iface = gr.Interface(fn=gen_entities, inputs="text", outputs="text")
|
|
|
|
| 16 |
# Load the Lora model
|
| 17 |
model = PeftModel.from_pretrained(model, peft_model_id)
|
| 18 |
|
| 19 |
+
model.eval()
|
| 20 |
|
| 21 |
def gen_entities(text):
|
| 22 |
text = f"<SP> text: {text}\n\n entities: "
|
|
|
|
| 24 |
with torch.cuda.amp.autocast():
|
| 25 |
output_tokens = model.generate(**batch, max_new_tokens=256, eos_token_id=50258)
|
| 26 |
|
| 27 |
+
# return tokenizer.decode(output_tokens, skip_special_tokens=False)
|
| 28 |
+
return tokenizer.batch_decode(output_tokens.detach().cpu().numpy(), skip_special_tokens=True)
|
| 29 |
|
| 30 |
|
| 31 |
iface = gr.Interface(fn=gen_entities, inputs="text", outputs="text")
|