Spaces:

sabssag
/

BlogPost

Sleeping

sabssag committed on Jul 22, 2024

Commit

ee5e01f

verified ·

1 Parent(s): 600c025

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -19,13 +19,17 @@ if text:
         # Generate text
         output = model.generate(
-            input_ids=encoded_input['input_ids'],
-            max_length=100,
-            num_return_sequences=1,
-            no_repeat_ngram_size=2,
-            top_p=0.95,
-            top_k=50
-        )
         # Decode generated text
         generated_text = tokenizer.decode(output[0], skip_special_tokens=True)

         # Generate text
         output = model.generate(
+	        input_ids=encoded_input,
+	        max_length=100,  # Specify the max length for the generated text
+	        num_return_sequences=1,  # Number of sequences to generate
+	        no_repeat_ngram_size=2,  # Avoid repeating n-grams of length 2
+	        top_k=50,  # Limits the sampling pool to top_k tokens
+	        top_p=0.95,  # Cumulative probability threshold for nucleus sampling
+	        temperature=0.7,  # Controls the randomness of predictions
+	        do_sample=True,  # Enable sampling
+	        attention_mask=encoded_input.new_ones(encoded_input.shape),
+	        pad_token_id=tokenizer.eos_token_id  # Use the end-of-sequence token as padding
+	    )
         # Decode generated text
         generated_text = tokenizer.decode(output[0], skip_special_tokens=True)