Spaces:

youngtsai
/

article_generator_2

Sleeping

App Files Community

youngtsai committed on Mar 20, 2024

Commit

67eb293

1 Parent(s): 8749812

def validate_article(generated_article, lesson_words, base_chars, original_word_count):

Browse files

Files changed (1) hide show

app.py +11 -3

app.py CHANGED Viewed

@@ -33,7 +33,7 @@ def extract_article_from_content(article_text):
 def validate_article(generated_article, lesson_words, base_chars, original_word_count):
     clean_article = "".join(char for char in generated_article if char not in "、，。！？；：「」『』（）《》【】'\n'")
-    not_every_new_word_is_used = not all(word in clean_article for word in lesson_words.split())
     word_out_of_range = not set(clean_article).issubset(set(lesson_words + base_chars))
     new_word_count = len(clean_article)
     word_count_error = not (0.9 * original_word_count <= new_word_count <= 1.1 * original_word_count)
@@ -104,6 +104,7 @@ def generate_new_article(lesson_words, original_article, original_word_count, ba
         not_every_new_word_is_used = validate_article_result['not_every_new_word_is_used']
         word_out_of_range = validate_article_result['word_out_of_range']
         word_count_error = validate_article_result['word_count_error']
         print("====validate_article====")
         print(f"not_every_new_word_is_used: {not_every_new_word_is_used}")
@@ -124,8 +125,15 @@ def generate_new_article(lesson_words, original_article, original_word_count, ba
             if word_count_error:
                 error_messages.append(f"The word count of the new article deviates more than 10% from the original ({original_word_count}).")
-            prompt += "\n".join(error_messages) + "\n"  # Append the error messages to the prompt for the next attempt
     return generated_article, validate_article_result

 def validate_article(generated_article, lesson_words, base_chars, original_word_count):
     clean_article = "".join(char for char in generated_article if char not in "、，。！？；：「」『』（）《》【】'\n'")
+    not_every_new_word_is_used = not all(word in clean_article for word in [char for char in lesson_words])
     word_out_of_range = not set(clean_article).issubset(set(lesson_words + base_chars))
     new_word_count = len(clean_article)
     word_count_error = not (0.9 * original_word_count <= new_word_count <= 1.1 * original_word_count)
         not_every_new_word_is_used = validate_article_result['not_every_new_word_is_used']
         word_out_of_range = validate_article_result['word_out_of_range']
         word_count_error = validate_article_result['word_count_error']
+        count_of_words_in_new_article = validate_article_result['count_of_words_in_new_article']
         print("====validate_article====")
         print(f"not_every_new_word_is_used: {not_every_new_word_is_used}")
             if word_count_error:
                 error_messages.append(f"The word count of the new article deviates more than 10% from the original ({original_word_count}).")
+            error_messages_str = "\n".join(error_messages) + "\n"  # Append the error messages to the prompt for the next attempt
+            prompt += f"""
+                The new article is {generated_article}.
+                word_count is {count_of_words_in_new_article}.
+                But the generated article is invalid. The following issues were found:
+                {error_messages_str}
+                please follow the summary of the key points and fix the errors to generate a new article.
+            """
+            print(f"Prompt for next attempt: {prompt}")
     return generated_article, validate_article_result