Spaces:
Paused
Paused
import copy
import json
import os
import random
import time
from datetime import datetime
from time import sleep

import requests
from datasets import load_dataset
def _attr(key, value):
    # One OTLP/JSON attribute entry: {"key": ..., "value": {"<type>_value": ...}}.
    return {"key": key, "value": value}


# Skeleton OTLP/JSON trace export: a single CLIENT span for one OpenAI chat
# call, shaped like the output of opentelemetry-instrumentation-openai.
# generate_json_from_template() uses this as the base document and overwrites
# the ids, timestamps, vendor/model, user message and service name.
TEMPLATE_JSON = {
    "resource_spans": [
        {
            "scope_spans": [
                {
                    "spans": [
                        {
                            "trace_id": "NQ01459b3A+aAHE+JwGWNQ==",
                            "end_time_unix_nano": "1725721375827041000",
                            "span_id": "0PCGpTowmVo=",
                            "kind": "SPAN_KIND_CLIENT",
                            "name": "openai.chat",
                            "start_time_unix_nano": "1725721375188928425",
                            "attributes": [
                                _attr("llm.request.type", {"string_value": "chat"}),
                                _attr("llm.vendor", {"string_value": "OpenAI"}),
                                _attr("llm.request.model", {"string_value": "gpt-3.5-turbo"}),
                                # NOTE: int_value entries are strings, matching the
                                # protobuf-JSON int64 encoding of the original export.
                                _attr("llm.request.max_tokens", {"int_value": "100"}),
                                _attr("llm.temperature", {"double_value": 0.5}),
                                _attr("llm.headers", {"string_value": "None"}),
                                _attr("llm.prompts.0.role", {"string_value": "system"}),
                                _attr("llm.prompts.0.content", {"string_value": "You are Responsible AI assistant to the user. "}),
                                _attr("llm.prompts.1.role", {"string_value": "user"}),
                                _attr("llm.prompts.1.content", {"string_value": "hello this my test message"}),
                                _attr("llm.response.model", {"string_value": "gpt-3.5-turbo-0125"}),
                                _attr("llm.usage.total_tokens", {"int_value": "35"}),
                                _attr("llm.usage.completion_tokens", {"int_value": "9"}),
                                _attr("llm.usage.prompt_tokens", {"int_value": "26"}),
                                _attr("llm.completions.0.finish_reason", {"string_value": "stop"}),
                                _attr("llm.completions.0.role", {"string_value": "assistant"}),
                                _attr("llm.completions.0.content", {"string_value": "Hello! How can I assist you today?"}),
                            ],
                            "status": {},
                        }
                    ],
                    "scope": {
                        "name": "opentelemetry.instrumentation.openai.v1",
                        "version": "0.10.4",
                    },
                }
            ],
            "resource": {
                "attributes": [
                    _attr("service.name", {"string_value": "llm-chat-app"})
                ]
            },
        }
    ]
}
def generate_random_id(size):
    """Return a random string of *size* characters drawn from the base64 alphabet.

    Used for fake OTLP trace/span ids; this is synthetic load-generation data,
    so ``random`` (not ``secrets``) is fine here.
    """
    return ''.join(random.choices('ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/=', k=size))


def generate_json_from_template(template, provider, model, service_name, message):
    """Build one OTLP trace JSON string from *template*.

    Fills in fresh random trace/span ids, current timestamps (with a random
    0.1-1s duration), the given LLM *provider*/*model*, the user *message*
    (the ``llm.prompts.1.content`` attribute) and the resource *service_name*.

    Fix over the original: the template is deep-copied before any writes.
    The previous version mutated the caller's dict (the shared module-level
    TEMPLATE_JSON) in place, so state from one call leaked into the next.

    Returns the serialized JSON string; *template* is left untouched.
    """
    doc = copy.deepcopy(template)
    span = doc['resource_spans'][0]['scope_spans'][0]['spans'][0]

    # Random ids first, then the duration draw — same RNG call order as before.
    span['trace_id'] = generate_random_id(22)
    span['span_id'] = generate_random_id(12)

    # Current time in nanoseconds; end time adds a random 100ms-1s duration.
    current_time_ns = int(time.time() * 1e9)
    span['start_time_unix_nano'] = str(current_time_ns)
    span['end_time_unix_nano'] = str(current_time_ns + random.randint(100000000, 1000000000))

    # Overwrite provider, model and the user message in the span attributes.
    for attr in span['attributes']:
        if attr['key'] == 'llm.vendor':
            attr['value']['string_value'] = provider
        elif attr['key'] == 'llm.request.model':
            attr['value']['string_value'] = model
        elif attr['key'] == 'llm.prompts.1.content':
            attr['value']['string_value'] = message

    # Overwrite service.name in the resource attributes.
    for attr in doc['resource_spans'][0]['resource']['attributes']:
        if attr['key'] == 'service.name':
            attr['value']['string_value'] = service_name

    return json.dumps(doc)
def send_json_to_remote(json_data):
    """POST an OTLP JSON payload to the Traceloop ingest endpoint.

    Reads TRACELOOP_BASE_URL and TRACELOOP_API_KEY from the environment and
    posts *json_data* (an already-serialized JSON string) to
    ``<base_url>/v1/traces`` with a bearer token.

    Returns a ``(status_code, response_text)`` tuple.
    Raises EnvironmentError when either environment variable is missing.

    Fix over the original: ``requests.post`` now carries an explicit timeout —
    without one, an unresponsive collector would hang the generator forever.
    """
    # Get environment variables
    base_url = os.getenv('TRACELOOP_BASE_URL')
    api_key = os.getenv('TRACELOOP_API_KEY')
    if not base_url or not api_key:
        raise EnvironmentError("TRACELOOP_BASE_URL or TRACELOOP_API_KEY is not set in environment variables.")
    # Set the headers and URL
    url = f"{base_url}/v1/traces"
    headers = {
        'Content-Type': 'application/json',
        'Authorization': f"Bearer {api_key}"
    }
    # Send the POST request; timeout covers both connect and read (seconds).
    response = requests.post(url, headers=headers, data=json_data, timeout=30)
    # Check the response status
    if response.status_code == 200:
        print("Data successfully sent!")
    else:
        print(f"Failed to send data. Status Code: {response.status_code}, Response: {response.text}")
    return (response.status_code, response.text)
def send_message(message):
    """Wrap *message* in a synthetic LLM trace and POST it to the collector.

    Picks a service name (exponentially decaying weights, each app half as
    likely as the previous one), then a provider by popularity weight, then a
    model uniformly from that provider's list, and forwards the resulting
    OTLP JSON via send_json_to_remote().

    Returns the ``(status_code, response_text)`` tuple from the send.
    """
    app_names = ["fintechgpt", "healthgpt", "mydoc", "knowledge-centre", "assistantgpt"]
    # 1, 1/2, 1/4, ... — steepness factor of 2 per position.
    app_weights = [2 ** -idx for idx in range(len(app_names))]
    service_name = random.choices(app_names, weights=app_weights, k=1)[0]

    # provider -> (model list, popularity weight)
    provider_catalog = {
        "Meta AI": (["LLaMA 65B", "LLaMA 33B"], 10),
        "Mistral": (["Mistral 7B"], 8),
        "Anthropic": (["Claude 3.5 Sonnet"], 15),
        "OpenAI": (["GPT-3", "GPT-3.5", "GPT-4", "GPT-4o"], 25),
        "Google": (["Gemini Ultra", "Gemini Pro", "Gemini Nano", "Lamda", "Palm"], 20),
        "Databricks": (["Dolly"], 5),
        "IBM AI": (["Watson NLP"], 5),
        "Azure AI": (["Azure OpenAI", "Custom GPT-3.5"], 7),
        "Snowflake": (["Snowflake GPT"], 3),
        "Krutrim": (["Krutrim LLM"], 2),
        "Baidu": (["Ernie 4.0"], 10),
        "Stability AI": (["StableLM 3B", "StableLM 7B"], 4),
        "Microsoft": (["Orca", "Phi-1"], 8)
    }

    # Weighted provider draw, then a uniform model draw within that provider.
    provider_names = list(provider_catalog.keys())
    provider_weights = [provider_catalog[name][1] for name in provider_names]
    chosen_provider = random.choices(provider_names, weights=provider_weights, k=1)[0]
    chosen_model = random.choice(provider_catalog[chosen_provider][0])

    payload = generate_json_from_template(TEMPLATE_JSON, chosen_provider, chosen_model, service_name, message)
    return send_json_to_remote(payload)
def main():
    """Sample prompts from public datasets and stream them as synthetic traces.

    Mixes prompt-injection samples, toxicity samples and plain test messages,
    shuffles them, and sends each through send_message() with a short pause.
    Requires network access (Hugging Face hub + the trace collector).
    """
    prompt_injection_dataset = load_dataset("deepset/prompt-injections")
    toxicity_prompts = load_dataset("allenai/real-toxicity-prompts")
    for i in range(2):
        # Collect 10 messages of each kind.
        # NOTE(review): shuffle(seed=42) is deterministic, so both outer
        # iterations re-send the same 10+10 dataset prompts — confirm intended.
        prompt_injection_sample = prompt_injection_dataset["train"].shuffle(seed=42).select(range(10))
        toxicity_sample = toxicity_prompts["train"].shuffle(seed=42).select(range(10))
        plain_messages = ["this is test conversation" for _ in range(10)]
        # Combine all messages into a single list
        all_messages = [msg["text"] for msg in prompt_injection_sample] + \
                       [msg["prompt"]["text"] for msg in toxicity_sample] + \
                       plain_messages
        # Shuffle the combined list to mix message types
        random.shuffle(all_messages)
        # Send each message
        for message in all_messages:
            print(f"Sending Message {message}")
            send_message(message)
            sleep(random.uniform(2, 4))  # random pause of 2-4 seconds between sends

if __name__ == "__main__":
    main()