Spaces:

yuvarajareddy001
/

Content_Generator_Using_LLM

Sleeping

App Files Files Community

Content_Generator_Using_LLM / post_generator.py

yuvarajareddy001

Upload 6 files

28f56d3 verified 12 months ago

raw

history blame contribute delete

2.78 kB

	from langchain_groq import ChatGroq
	import os
	from dotenv import load_dotenv
	import pandas as pd
	import json


	class FewShotPosts:
	def __init__(self, file_path="processed_posts.json"):
	self.df = None
	self.unique_tags = None
	self.load_posts(file_path)

	def load_posts(self, file_path):
	with open(file_path, encoding="utf-8") as f:
	posts = json.load(f)
	self.df = pd.json_normalize(posts)
	self.df['length'] = self.df['line_count'].apply(self.categorize_length)
	# collect unique tags
	all_tags = self.df['tags'].apply(lambda x: x).sum()
	self.unique_tags = list(set(all_tags))

	def get_filtered_posts(self, length, language, tag):
	df_filtered = self.df[
	(self.df['tags'].apply(lambda tags: tag in tags)) & # Tags contain 'Influencer'
	(self.df['language'] == language) & # Language is 'English'
	(self.df['length'] == length) # Line count is less than 5
	]
	return df_filtered.to_dict(orient='records')

	def categorize_length(self, line_count):
	if line_count < 5:
	return "Short"
	elif 5 <= line_count <= 10:
	return "Medium"
	else:
	return "Long"

	def get_tags(self):
	return self.unique_tags


	load_dotenv()
	llm = ChatGroq(groq_api_key=os.getenv("GROQ_API_KEY"), model_name="llama-3.3-70b-versatile")
	few_shot = FewShotPosts()

	def get_length_str(length):
	if length == "Short":
	return "1 to 5 lines"
	if length == "Medium":
	return "6 to 10 lines"
	if length == "Long":
	return "11 to 15 lines"


	def generate_post(length, language, tag):
	prompt = get_prompt(length, language, tag)
	response = llm.invoke(prompt)
	return response.content


	def get_prompt(length, language, tag):
	length_str = get_length_str(length)

	prompt = f'''
	Generate a LinkedIn post using the below information. No preamble.

	1) Topic: {tag}
	2) Length: {length_str}
	3) Language: {language}
	If Language is Hinglish then it means it is a mix of Hindi and English.
	The script for the generated post should always be English.
	'''
	# prompt = prompt.format(post_topic=tag, post_length=length_str, post_language=language)

	examples = few_shot.get_filtered_posts(length, language, tag)

	if len(examples) > 0:
	prompt += "4) Use the writing style as per the following examples."

	for i, post in enumerate(examples):
	post_text = post['text']
	prompt += f'\n\n Example {i+1}: \n\n {post_text}'

	if i == 1: # Use max two samples
	break

	return prompt


	if __name__ == "__main__":
	print(generate_post("Medium", "English", "Mental Health"))