llmopt-server / data /complexity_training_data.json
Shrot101's picture
feat: upgrade LLMOpt to V2 ML-powered architecture
eff2120
[
{
"query": "What is Python?",
"complexity": 0.05,
"tier": "trivial",
"domain": "factual"
},
{
"query": "What is the capital of France?",
"complexity": 0.04,
"tier": "trivial",
"domain": "factual"
},
{
"query": "Who invented the telephone?",
"complexity": 0.05,
"tier": "trivial",
"domain": "factual"
},
{
"query": "What does HTTP stand for?",
"complexity": 0.06,
"tier": "trivial",
"domain": "factual"
},
{
"query": "Translate 'hello' to Spanish",
"complexity": 0.07,
"tier": "trivial",
"domain": "translation"
},
{
"query": "What year was Python created?",
"complexity": 0.04,
"tier": "trivial",
"domain": "factual"
},
{
"query": "Is Java object-oriented?",
"complexity": 0.07,
"tier": "trivial",
"domain": "factual"
},
{
"query": "What is RAM?",
"complexity": 0.05,
"tier": "trivial",
"domain": "factual"
},
{
"query": "Summarize this paragraph: The quick brown fox...",
"complexity": 0.18,
"tier": "easy",
"domain": "summarization"
},
{
"query": "Explain what a variable is in programming",
"complexity": 0.15,
"tier": "easy",
"domain": "code"
},
{
"query": "What is the difference between a list and a tuple in Python?",
"complexity": 0.22,
"tier": "easy",
"domain": "code"
},
{
"query": "Write a simple hello world in JavaScript",
"complexity": 0.2,
"tier": "easy",
"domain": "code"
},
{
"query": "What is recursion? Give a simple example",
"complexity": 0.25,
"tier": "easy",
"domain": "code"
},
{
"query": "Translate this paragraph to French",
"complexity": 0.2,
"tier": "easy",
"domain": "translation"
},
{
"query": "Summarize the key points of agile methodology",
"complexity": 0.25,
"tier": "easy",
"domain": "summarization"
},
{
"query": "Explain binary search with a code example",
"complexity": 0.4,
"tier": "medium",
"domain": "code"
},
{
"query": "Write a Python function to check if a number is prime",
"complexity": 0.38,
"tier": "medium",
"domain": "code"
},
{
"query": "Compare REST and GraphQL APIs",
"complexity": 0.42,
"tier": "medium",
"domain": "reasoning"
},
{
"query": "Explain the CAP theorem in distributed systems",
"complexity": 0.48,
"tier": "medium",
"domain": "reasoning"
},
{
"query": "Write SQL to find duplicate rows in a table",
"complexity": 0.4,
"tier": "medium",
"domain": "code"
},
{
"query": "Explain gradient descent step by step",
"complexity": 0.5,
"tier": "medium",
"domain": "math"
},
{
"query": "What is the time complexity of quicksort? Explain with an example",
"complexity": 0.45,
"tier": "medium",
"domain": "code"
},
{
"query": "Design a rate limiter for an API",
"complexity": 0.62,
"tier": "hard",
"domain": "code"
},
{
"query": "Implement a LRU cache in Python",
"complexity": 0.6,
"tier": "hard",
"domain": "code"
},
{
"query": "Explain the Transformer architecture in detail",
"complexity": 0.7,
"tier": "hard",
"domain": "science"
},
{
"query": "Write a comprehensive tutorial on Docker and Kubernetes",
"complexity": 0.68,
"tier": "hard",
"domain": "code"
},
{
"query": "Analyze the pros and cons of microservices vs monoliths",
"complexity": 0.65,
"tier": "hard",
"domain": "reasoning"
},
{
"query": "Derive the backpropagation equations from first principles",
"complexity": 0.8,
"tier": "hard",
"domain": "math"
},
{
"query": "Design the Paxos consensus algorithm",
"complexity": 0.92,
"tier": "expert",
"domain": "reasoning"
},
{
"query": "Prove that P ≠ NP (or outline the key open problems)",
"complexity": 0.98,
"tier": "expert",
"domain": "math"
},
{
"query": "Design a distributed SQL database from scratch",
"complexity": 0.95,
"tier": "expert",
"domain": "code"
},
{
"query": "Implement a compiler for a simple language in Python",
"complexity": 0.9,
"tier": "expert",
"domain": "code"
},
{
"query": "Explain quantum entanglement and Bell's inequality with math",
"complexity": 0.88,
"tier": "expert",
"domain": "science"
},
{
"query": "Write a full-stack web app with React and FastAPI",
"complexity": 0.85,
"tier": "expert",
"domain": "code"
},
{
"query": "Analyze the ethical implications of AI in healthcare",
"complexity": 0.72,
"tier": "hard",
"domain": "reasoning"
},
{
"query": "Compare BERT and GPT architectures in depth",
"complexity": 0.75,
"tier": "hard",
"domain": "science"
},
{
"query": "What is async/await in Python?",
"complexity": 0.28,
"tier": "easy",
"domain": "code"
},
{
"query": "Explain SOLID principles with examples",
"complexity": 0.45,
"tier": "medium",
"domain": "code"
},
{
"query": "Write a regex to validate email addresses",
"complexity": 0.3,
"tier": "easy",
"domain": "code"
},
{
"query": "Design a URL shortener system like bit.ly",
"complexity": 0.7,
"tier": "hard",
"domain": "code"
},
{
"query": "Implement a red-black tree in C++",
"complexity": 0.8,
"tier": "hard",
"domain": "code"
},
{
"query": "Explain Bayesian inference with an example",
"complexity": 0.65,
"tier": "hard",
"domain": "math"
},
{
"query": "Write a neural network from scratch in numpy",
"complexity": 0.82,
"tier": "expert",
"domain": "code"
},
{
"query": "Translate this legal document to Spanish",
"complexity": 0.35,
"tier": "medium",
"domain": "translation"
},
{
"query": "Summarize this 50-page research paper",
"complexity": 0.45,
"tier": "medium",
"domain": "summarization"
},
{
"query": "Debate the pros and cons of nuclear energy",
"complexity": 0.6,
"tier": "hard",
"domain": "reasoning"
},
{
"query": "Write a creative short story about time travel",
"complexity": 0.42,
"tier": "medium",
"domain": "creative"
},
{
"query": "Explain what a closure is in JavaScript",
"complexity": 0.3,
"tier": "easy",
"domain": "code"
},
{
"query": "What is the difference between TCP and UDP?",
"complexity": 0.22,
"tier": "easy",
"domain": "factual"
},
{
"query": "Prove the Pythagorean theorem",
"complexity": 0.55,
"tier": "medium",
"domain": "math"
},
{
"query": "What is Python?",
"complexity": 0.05,
"tier": "trivial",
"domain": "factual",
"model": "gpt-3.5-turbo"
},
{
"query": "What is the capital of France?",
"complexity": 0.04,
"tier": "trivial",
"domain": "factual",
"model": "claude-3-haiku-20240307"
},
{
"query": "Who invented the telephone?",
"complexity": 0.05,
"tier": "trivial",
"domain": "factual",
"model": "llama3.2:3b"
},
{
"query": "What does HTTP stand for?",
"complexity": 0.06,
"tier": "trivial",
"domain": "factual",
"model": "gemini-1.5-flash"
},
{
"query": "Translate 'hello' to Spanish",
"complexity": 0.07,
"tier": "trivial",
"domain": "translation",
"model": "mistral-small-latest"
},
{
"query": "What year was Python created?",
"complexity": 0.04,
"tier": "trivial",
"domain": "factual",
"model": "gpt-4o-mini"
},
{
"query": "Is Java object-oriented?",
"complexity": 0.07,
"tier": "trivial",
"domain": "factual",
"model": "llama3.1:8b"
},
{
"query": "What is RAM?",
"complexity": 0.05,
"tier": "trivial",
"domain": "factual",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "What is 2+2?",
"complexity": 0.02,
"tier": "trivial",
"domain": "math",
"model": "gpt-3.5-turbo"
},
{
"query": "Name one planet in our solar system",
"complexity": 0.03,
"tier": "trivial",
"domain": "science",
"model": "llama3.2:3b"
},
{
"query": "Summarize this: 'The quick brown fox jumps over the lazy dog.'",
"complexity": 0.18,
"tier": "easy",
"domain": "summarization",
"model": "gpt-4o-mini"
},
{
"query": "Explain what a variable is in programming",
"complexity": 0.15,
"tier": "easy",
"domain": "code",
"model": "claude-3-haiku-20240307"
},
{
"query": "What is the difference between a list and a tuple in Python?",
"complexity": 0.22,
"tier": "easy",
"domain": "code",
"model": "gemini-1.5-flash"
},
{
"query": "Write a simple hello world in JavaScript",
"complexity": 0.2,
"tier": "easy",
"domain": "code",
"model": "mistral-small-latest"
},
{
"query": "What is recursion? Give a simple example",
"complexity": 0.25,
"tier": "easy",
"domain": "code",
"model": "llama3.1:8b"
},
{
"query": "Translate 'Good morning, how are you?' to French",
"complexity": 0.2,
"tier": "easy",
"domain": "translation",
"model": "gpt-4o-mini"
},
{
"query": "Summarize the key points of agile methodology",
"complexity": 0.25,
"tier": "easy",
"domain": "summarization",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "Solve for x: 2x + 5 = 15",
"complexity": 0.12,
"tier": "easy",
"domain": "math",
"model": "gpt-3.5-turbo"
},
{
"query": "What is photosynthesis? Explain briefly",
"complexity": 0.17,
"tier": "easy",
"domain": "science",
"model": "gemini-1.5-flash"
},
{
"query": "Write a haiku about spring",
"complexity": 0.21,
"tier": "easy",
"domain": "creative",
"model": "llama3.1:70b"
},
{
"query": "Why is the sky blue?",
"complexity": 0.18,
"tier": "easy",
"domain": "reasoning",
"model": "mistral-large-latest"
},
{
"query": "Explain binary search with a code example",
"complexity": 0.4,
"tier": "medium",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Write a Python function to check if a number is prime",
"complexity": 0.38,
"tier": "medium",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Compare REST and GraphQL APIs",
"complexity": 0.42,
"tier": "medium",
"domain": "reasoning",
"model": "gpt-4o"
},
{
"query": "Explain the CAP theorem in distributed systems",
"complexity": 0.48,
"tier": "medium",
"domain": "reasoning",
"model": "gemini-1.5-pro"
},
{
"query": "Write SQL to find duplicate rows in a table",
"complexity": 0.4,
"tier": "medium",
"domain": "code",
"model": "llama3.1:70b"
},
{
"query": "Explain gradient descent step by step",
"complexity": 0.5,
"tier": "medium",
"domain": "math",
"model": "deepseek-chat"
},
{
"query": "What is the time complexity of quicksort? Explain with an example",
"complexity": 0.45,
"tier": "medium",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "Translate this technical document abstract to German",
"complexity": 0.35,
"tier": "medium",
"domain": "translation",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Summarize the plot of '1984' by George Orwell",
"complexity": 0.37,
"tier": "medium",
"domain": "summarization",
"model": "mistral-large-latest"
},
{
"query": "Write a short story about a robot learning to dream",
"complexity": 0.44,
"tier": "medium",
"domain": "creative",
"model": "gpt-4o"
},
{
"query": "Explain the theory of relativity in simple terms",
"complexity": 0.46,
"tier": "medium",
"domain": "science",
"model": "gemini-1.5-pro"
},
{
"query": "What is the difference between supervised and unsupervised learning?",
"complexity": 0.36,
"tier": "medium",
"domain": "factual",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "Solve the quadratic equation: x^2 - 5x + 6 = 0",
"complexity": 0.32,
"tier": "medium",
"domain": "math",
"model": "llama3.1:70b"
},
{
"query": "Design a rate limiter for an API",
"complexity": 0.62,
"tier": "hard",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "Implement an LRU cache in Python",
"complexity": 0.6,
"tier": "hard",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Explain the Transformer architecture in detail",
"complexity": 0.7,
"tier": "hard",
"domain": "science",
"model": "deepseek-chat"
},
{
"query": "Write a comprehensive tutorial on Docker and Kubernetes",
"complexity": 0.68,
"tier": "hard",
"domain": "code",
"model": "gemini-1.5-pro"
},
{
"query": "Analyze the pros and cons of microservices vs monoliths",
"complexity": 0.65,
"tier": "hard",
"domain": "reasoning",
"model": "gpt-4o"
},
{
"query": "Derive the backpropagation equations from first principles",
"complexity": 0.8,
"tier": "expert",
"domain": "math",
"model": "deepseek-chat"
},
{
"query": "Prove that the square root of 2 is irrational",
"complexity": 0.58,
"tier": "hard",
"domain": "math",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Translate this legal contract summary to Japanese",
"complexity": 0.55,
"tier": "hard",
"domain": "translation",
"model": "gpt-4o"
},
{
"query": "Summarize the latest advances in quantum computing (2023-2024)",
"complexity": 0.66,
"tier": "hard",
"domain": "summarization",
"model": "gemini-1.5-pro"
},
{
"query": "Write a poem in the style of Edgar Allan Poe about AI",
"complexity": 0.63,
"tier": "hard",
"domain": "creative",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Explain the ethics of autonomous weapons systems",
"complexity": 0.67,
"tier": "hard",
"domain": "reasoning",
"model": "gpt-4o"
},
{
"query": "What is the role of the Golgi apparatus in cells?",
"complexity": 0.42,
"tier": "medium",
"domain": "science",
"model": "mistral-large-latest"
},
{
"query": "Write a script to scrape a website and extract all links",
"complexity": 0.52,
"tier": "medium",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Explain the concept of idempotency in REST APIs",
"complexity": 0.39,
"tier": "medium",
"domain": "code",
"model": "gpt-4o-mini"
},
{
"query": "Describe the water cycle for a 10-year-old",
"complexity": 0.19,
"tier": "easy",
"domain": "science",
"model": "llama3.2:3b"
},
{
"query": "What is a neural network? Give a simple analogy",
"complexity": 0.24,
"tier": "easy",
"domain": "science",
"model": "claude-3-haiku-20240307"
},
{
"query": "Solve: If a train travels 60 mph for 2 hours, how far does it go?",
"complexity": 0.08,
"tier": "trivial",
"domain": "math",
"model": "gpt-3.5-turbo"
},
{
"query": "Name three data types in Python",
"complexity": 0.06,
"tier": "trivial",
"domain": "code",
"model": "llama3.2:3b"
},
{
"query": "Translate 'Thank you very much' to Italian",
"complexity": 0.07,
"tier": "trivial",
"domain": "translation",
"model": "gemini-1.5-flash"
},
{
"query": "What is the main ingredient in guacamole?",
"complexity": 0.03,
"tier": "trivial",
"domain": "factual",
"model": "mistral-small-latest"
},
{
"query": "Write a for loop that prints numbers 1 to 10 in Python",
"complexity": 0.16,
"tier": "easy",
"domain": "code",
"model": "gpt-4o-mini"
},
{
"query": "Explain what a deadlock is in concurrency",
"complexity": 0.33,
"tier": "medium",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Compare socialism and capitalism",
"complexity": 0.47,
"tier": "medium",
"domain": "reasoning",
"model": "gpt-4o"
},
{
"query": "What is the significance of the Higgs boson discovery?",
"complexity": 0.56,
"tier": "medium",
"domain": "science",
"model": "deepseek-chat"
},
{
"query": "Write a SQL query to join three tables",
"complexity": 0.41,
"tier": "medium",
"domain": "code",
"model": "llama3.1:70b"
},
{
"query": "Create a simple JavaScript function that returns the current date",
"complexity": 0.14,
"tier": "easy",
"domain": "code",
"model": "mistral-small-latest"
},
{
"query": "What is the Pythagorean theorem? Provide an example",
"complexity": 0.23,
"tier": "easy",
"domain": "math",
"model": "gemini-1.5-flash"
},
{
"query": "Summarize the main ideas of Stoic philosophy",
"complexity": 0.49,
"tier": "medium",
"domain": "summarization",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "Write a recipe for chocolate chip cookies in poetic form",
"complexity": 0.51,
"tier": "medium",
"domain": "creative",
"model": "gpt-4o-mini"
},
{
"query": "Explain the difference between CPU and GPU",
"complexity": 0.27,
"tier": "easy",
"domain": "factual",
"model": "llama3.1:8b"
},
{
"query": "Solve: What is the derivative of x^3?",
"complexity": 0.31,
"tier": "medium",
"domain": "math",
"model": "deepseek-chat"
},
{
"query": "Design a simple task scheduler in Python",
"complexity": 0.59,
"tier": "medium",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "Explain the concept of 'impostor syndrome' in the workplace",
"complexity": 0.34,
"tier": "easy",
"domain": "reasoning",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "What are the three laws of robotics?",
"complexity": 0.09,
"tier": "trivial",
"domain": "science",
"model": "gpt-3.5-turbo"
},
{
"query": "Translate 'The food was delicious' to Mandarin Chinese",
"complexity": 0.26,
"tier": "easy",
"domain": "translation",
"model": "gemini-1.5-pro"
},
{
"query": "Write a CSS snippet to center a div",
"complexity": 0.13,
"tier": "easy",
"domain": "code",
"model": "mistral-small-latest"
},
{
"query": "Explain the Drake equation",
"complexity": 0.44,
"tier": "medium",
"domain": "science",
"model": "llama3.1:70b"
},
{
"query": "What is the difference between error and exception in programming?",
"complexity": 0.21,
"tier": "easy",
"domain": "code",
"model": "gpt-4o-mini"
},
{
"query": "Solve: 15% of 200",
"complexity": 0.05,
"tier": "trivial",
"domain": "math",
"model": "llama3.2:3b"
},
{
"query": "Write a haiku about debugging",
"complexity": 0.28,
"tier": "easy",
"domain": "creative",
"model": "claude-3-haiku-20240307"
},
{
"query": "Explain the concept of 'technical debt'",
"complexity": 0.37,
"tier": "medium",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "What are the benefits of using TypeScript over JavaScript?",
"complexity": 0.29,
"tier": "easy",
"domain": "code",
"model": "mistral-large-latest"
},
{
"query": "Summarize the plot of 'The Great Gatsby' in one paragraph",
"complexity": 0.38,
"tier": "medium",
"domain": "summarization",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Translate the following error message to Spanish: 'File not found'",
"complexity": 0.08,
"tier": "trivial",
"domain": "translation",
"model": "gemini-1.5-flash"
},
{
"query": "Write a Python decorator that measures execution time",
"complexity": 0.55,
"tier": "medium",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Explain the concept of 'virtue ethics'",
"complexity": 0.46,
"tier": "medium",
"domain": "reasoning",
"model": "gpt-4o"
},
{
"query": "What is the function of the mitochondria?",
"complexity": 0.11,
"tier": "easy",
"domain": "science",
"model": "llama3.1:8b"
},
{
"query": "Solve for x: log(x) = 2",
"complexity": 0.3,
"tier": "medium",
"domain": "math",
"model": "gemini-1.5-pro"
},
{
"query": "Design a simple REST API for a todo list",
"complexity": 0.57,
"tier": "medium",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Explain the difference between let, const, and var in JavaScript",
"complexity": 0.23,
"tier": "easy",
"domain": "code",
"model": "gpt-4o-mini"
},
{
"query": "Write a limerick about a programmer",
"complexity": 0.32,
"tier": "easy",
"domain": "creative",
"model": "llama3.1:70b"
},
{
"query": "What is the greenhouse effect? Explain simply",
"complexity": 0.19,
"tier": "easy",
"domain": "science",
"model": "claude-3-haiku-20240307"
},
{
"query": "Translate 'I would like to book a flight' to French",
"complexity": 0.16,
"tier": "easy",
"domain": "translation",
"model": "mistral-small-latest"
},
{
"query": "What is the difference between a stack and a queue?",
"complexity": 0.24,
"tier": "easy",
"domain": "code",
"model": "gpt-3.5-turbo"
},
{
"query": "Explain the concept of 'opportunity cost' in economics",
"complexity": 0.28,
"tier": "easy",
"domain": "reasoning",
"model": "gemini-1.5-flash"
},
{
"query": "Write a binary search algorithm in Python",
"complexity": 0.43,
"tier": "medium",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Summarize the key innovations of the Renaissance",
"complexity": 0.41,
"tier": "medium",
"domain": "summarization",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Solve: What is the area of a circle with radius 5?",
"complexity": 0.1,
"tier": "easy",
"domain": "math",
"model": "llama3.2:3b"
},
{
"query": "Create a simple HTML page with a button",
"complexity": 0.12,
"tier": "easy",
"domain": "code",
"model": "gpt-4o-mini"
},
{
"query": "Explain the concept of 'black swan events'",
"complexity": 0.45,
"tier": "medium",
"domain": "reasoning",
"model": "gpt-4o"
},
{
"query": "What is CRISPR used for?",
"complexity": 0.22,
"tier": "easy",
"domain": "science",
"model": "gemini-1.5-pro"
},
{
"query": "Write a regular expression to match an email address",
"complexity": 0.34,
"tier": "medium",
"domain": "code",
"model": "mistral-large-latest"
},
{
"query": "Translate 'Where is the nearest hospital?' to German",
"complexity": 0.15,
"tier": "easy",
"domain": "translation",
"model": "claude-3-haiku-20240307"
},
{
"query": "Write a short story about a character who wakes up with amnesia",
"complexity": 0.49,
"tier": "medium",
"domain": "creative",
"model": "llama3.1:70b"
},
{
"query": "Explain the difference between correlation and causation",
"complexity": 0.33,
"tier": "medium",
"domain": "reasoning",
"model": "deepseek-chat"
},
{
"query": "What is a SAT solver used for in computer science?",
"complexity": 0.52,
"tier": "medium",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "What is an API?",
"complexity": 0.06,
"tier": "trivial",
"domain": "factual",
"model": "llama3.2:3b"
},
{
"query": "Who wrote 'Romeo and Juliet'?",
"complexity": 0.04,
"tier": "trivial",
"domain": "factual",
"model": "gpt-3.5-turbo"
},
{
"query": "What does CSS stand for?",
"complexity": 0.05,
"tier": "trivial",
"domain": "factual",
"model": "claude-3-haiku-20240307"
},
{
"query": "Translate 'good night' to German",
"complexity": 0.06,
"tier": "trivial",
"domain": "translation",
"model": "gemini-1.5-flash"
},
{
"query": "What is the square root of 64?",
"complexity": 0.03,
"tier": "trivial",
"domain": "math",
"model": "mistral-small-latest"
},
{
"query": "What color is the sky on a clear day?",
"complexity": 0.02,
"tier": "trivial",
"domain": "science",
"model": "llama3.1:8b"
},
{
"query": "What does SQL stand for?",
"complexity": 0.06,
"tier": "trivial",
"domain": "factual",
"model": "gpt-4o-mini"
},
{
"query": "Name one mammal that can fly",
"complexity": 0.04,
"tier": "trivial",
"domain": "science",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "Translate 'I love you' to French",
"complexity": 0.05,
"tier": "trivial",
"domain": "translation",
"model": "llama3.2:3b"
},
{
"query": "What is the largest ocean on Earth?",
"complexity": 0.03,
"tier": "trivial",
"domain": "factual",
"model": "gpt-3.5-turbo"
},
{
"query": "Explain what a function is in programming",
"complexity": 0.16,
"tier": "easy",
"domain": "code",
"model": "gemini-1.5-flash"
},
{
"query": "Write a simple for loop in C++ that prints 0 to 9",
"complexity": 0.19,
"tier": "easy",
"domain": "code",
"model": "mistral-small-latest"
},
{
"query": "What is the difference between '==' and '===' in JavaScript?",
"complexity": 0.21,
"tier": "easy",
"domain": "code",
"model": "llama3.1:8b"
},
{
"query": "Translate 'The weather is nice today' to Italian",
"complexity": 0.18,
"tier": "easy",
"domain": "translation",
"model": "gpt-4o-mini"
},
{
"query": "Summarize the water cycle in two sentences",
"complexity": 0.17,
"tier": "easy",
"domain": "summarization",
"model": "claude-3-haiku-20240307"
},
{
"query": "Solve for y: 3y - 7 = 11",
"complexity": 0.11,
"tier": "easy",
"domain": "math",
"model": "llama3.2:3b"
},
{
"query": "Why do we have seasons?",
"complexity": 0.19,
"tier": "easy",
"domain": "science",
"model": "gpt-3.5-turbo"
},
{
"query": "Write a two-line poem about the moon",
"complexity": 0.14,
"tier": "easy",
"domain": "creative",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "Explain why ice floats on water",
"complexity": 0.2,
"tier": "easy",
"domain": "reasoning",
"model": "gemini-1.5-pro"
},
{
"query": "What is a stack overflow in programming?",
"complexity": 0.23,
"tier": "easy",
"domain": "code",
"model": "mistral-large-latest"
},
{
"query": "Write a Python function to find the maximum of three numbers",
"complexity": 0.27,
"tier": "easy",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "What is the difference between a class and an object?",
"complexity": 0.25,
"tier": "easy",
"domain": "code",
"model": "gpt-4o-mini"
},
{
"query": "Translate 'Where is the bathroom?' to Spanish",
"complexity": 0.12,
"tier": "easy",
"domain": "translation",
"model": "llama3.1:70b"
},
{
"query": "Summarize the main idea of the movie 'Inception'",
"complexity": 0.29,
"tier": "easy",
"domain": "summarization",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Solve: What is 25% of 80?",
"complexity": 0.08,
"tier": "trivial",
"domain": "math",
"model": "gpt-4o"
},
{
"query": "Write a short story about a lost key",
"complexity": 0.35,
"tier": "medium",
"domain": "creative",
"model": "gpt-4o"
},
{
"query": "Explain how a memoization works with an example in JavaScript",
"complexity": 0.44,
"tier": "medium",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Compare TCP and UDP protocols in detail",
"complexity": 0.43,
"tier": "medium",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "What is the halting problem? Why is it important?",
"complexity": 0.51,
"tier": "medium",
"domain": "reasoning",
"model": "gpt-4o"
},
{
"query": "Derive the formula for the area of a circle",
"complexity": 0.37,
"tier": "medium",
"domain": "math",
"model": "gemini-1.5-pro"
},
{
"query": "Explain the second law of thermodynamics",
"complexity": 0.53,
"tier": "medium",
"domain": "science",
"model": "llama3.1:70b"
},
{
"query": "Write a SQL query to get the top 5 highest paid employees",
"complexity": 0.39,
"tier": "medium",
"domain": "code",
"model": "mistral-large-latest"
},
{
"query": "Translate this business email to Japanese: 'Dear Sir, we appreciate your prompt response.'",
"complexity": 0.48,
"tier": "medium",
"domain": "translation",
"model": "gpt-4o"
},
{
"query": "Summarize the plot of 'The Odyssey' in 100 words",
"complexity": 0.42,
"tier": "medium",
"domain": "summarization",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "Write a sonnet about artificial intelligence",
"complexity": 0.54,
"tier": "medium",
"domain": "creative",
"model": "deepseek-chat"
},
{
"query": "Explain the concept of race conditions in multithreading",
"complexity": 0.46,
"tier": "medium",
"domain": "code",
"model": "gpt-4o-mini"
},
{
"query": "What is the difference between deep learning and traditional machine learning?",
"complexity": 0.47,
"tier": "medium",
"domain": "science",
"model": "gemini-1.5-pro"
},
{
"query": "Solve the integral of x^2 dx",
"complexity": 0.36,
"tier": "medium",
"domain": "math",
"model": "llama3.1:8b"
},
{
"query": "Implement a binary tree traversal in Python (in-order)",
"complexity": 0.56,
"tier": "medium",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Design a simple load balancer algorithm",
"complexity": 0.58,
"tier": "medium",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "Write a regular expression to validate a US phone number",
"complexity": 0.41,
"tier": "medium",
"domain": "code",
"model": "mistral-small-latest"
},
{
"query": "Explain the prisoner's dilemma and its implications",
"complexity": 0.49,
"tier": "medium",
"domain": "reasoning",
"model": "deepseek-chat"
},
{
"query": "What is the Golden Ratio? Provide examples",
"complexity": 0.34,
"tier": "medium",
"domain": "math",
"model": "gpt-4o-mini"
},
{
"query": "Translate a medical prescription summary to German",
"complexity": 0.52,
"tier": "medium",
"domain": "translation",
"model": "llama3.1:70b"
},
{
"query": "Summarize the key arguments in Plato's 'Republic'",
"complexity": 0.57,
"tier": "hard",
"domain": "summarization",
"model": "gpt-4o"
},
{
"query": "Write a dark fantasy short story about a cursed mirror",
"complexity": 0.64,
"tier": "hard",
"domain": "creative",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Implement a concurrent web scraper in Python with asyncio",
"complexity": 0.69,
"tier": "hard",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Explain the proof of Fermat's Last Theorem at a high level",
"complexity": 0.78,
"tier": "hard",
"domain": "math",
"model": "gpt-4o"
},
{
"query": "Analyze the performance implications of columnar vs row-based storage",
"complexity": 0.66,
"tier": "hard",
"domain": "reasoning",
"model": "gemini-1.5-pro"
},
{
"query": "Describe the architecture of a distributed key-value store like DynamoDB",
"complexity": 0.72,
"tier": "hard",
"domain": "code",
"model": "llama3.1:70b"
},
{
"query": "What is the Bellman equation in reinforcement learning?",
"complexity": 0.63,
"tier": "hard",
"domain": "science",
"model": "mistral-large-latest"
},
{
"query": "Translate a complex legal disclaimer to French",
"complexity": 0.61,
"tier": "hard",
"domain": "translation",
"model": "gpt-4o"
},
{
"query": "Design a real-time chat system supporting 1 million concurrent users",
"complexity": 0.75,
"tier": "hard",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Explain the concept of zero-knowledge proofs",
"complexity": 0.7,
"tier": "hard",
"domain": "science",
"model": "deepseek-chat"
},
{
"query": "Write a detailed guide on optimizing Python code with C extensions",
"complexity": 0.68,
"tier": "hard",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "Prove that there are infinitely many prime numbers",
"complexity": 0.59,
"tier": "hard",
"domain": "math",
"model": "gemini-1.5-pro"
},
{
"query": "What is the 'butterfly effect' in chaos theory?",
"complexity": 0.55,
"tier": "medium",
"domain": "science",
"model": "llama3.1:8b"
},
{
"query": "Write a memoization decorator in Python",
"complexity": 0.53,
"tier": "medium",
"domain": "code",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "Explain the difference between a process and a thread",
"complexity": 0.31,
"tier": "easy",
"domain": "code",
"model": "gpt-4o-mini"
},
{
"query": "Translate 'Congratulations on your new job' to Portuguese",
"complexity": 0.13,
"tier": "easy",
"domain": "translation",
"model": "mistral-small-latest"
},
{
"query": "What is the role of the nucleus in a cell?",
"complexity": 0.15,
"tier": "easy",
"domain": "science",
"model": "gemini-1.5-flash"
},
{
"query": "Write a Java program to reverse a string",
"complexity": 0.26,
"tier": "easy",
"domain": "code",
"model": "llama3.2:3b"
},
{
"query": "Solve for x: 4x^2 - 16 = 0",
"complexity": 0.28,
"tier": "easy",
"domain": "math",
"model": "gpt-3.5-turbo"
},
{
"query": "Write a haiku about winter",
"complexity": 0.15,
"tier": "easy",
"domain": "creative",
"model": "claude-3-haiku-20240307"
},
{
"query": "Explain why the sky is red at sunset",
"complexity": 0.27,
"tier": "easy",
"domain": "reasoning",
"model": "gpt-4o-mini"
},
{
"query": "What is an abstract class in Java?",
"complexity": 0.29,
"tier": "easy",
"domain": "code",
"model": "mistral-large-latest"
},
{
"query": "Write a simple HTML form with two input fields",
"complexity": 0.18,
"tier": "easy",
"domain": "code",
"model": "llama3.1:70b"
},
{
"query": "Translate 'I need a doctor' to Korean",
"complexity": 0.17,
"tier": "easy",
"domain": "translation",
"model": "deepseek-chat"
},
{
"query": "Summarize the plot of 'Hamlet' in three sentences",
"complexity": 0.32,
"tier": "easy",
"domain": "summarization",
"model": "gpt-4o"
},
{
"query": "What is the difference between GET and POST in HTTP?",
"complexity": 0.22,
"tier": "easy",
"domain": "code",
"model": "gemini-1.5-pro"
},
{
"query": "Write a C program to calculate factorial using recursion",
"complexity": 0.4,
"tier": "medium",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Explain the concept of 'sharding' in databases",
"complexity": 0.48,
"tier": "medium",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "What is the difference between L1 and L2 regularization?",
"complexity": 0.54,
"tier": "medium",
"domain": "science",
"model": "deepseek-chat"
},
{
"query": "Solve the system of equations: 2x + y = 10, x - y = 2",
"complexity": 0.33,
"tier": "medium",
"domain": "math",
"model": "llama3.1:70b"
},
{
"query": "Write a Python script to download an image from a URL",
"complexity": 0.36,
"tier": "medium",
"domain": "code",
"model": "mistral-large-latest"
},
{
"query": "Explain the Turing test and its criticisms",
"complexity": 0.45,
"tier": "medium",
"domain": "reasoning",
"model": "gemini-1.5-pro"
},
{
"query": "Translate 'The system is currently offline' to Russian",
"complexity": 0.39,
"tier": "medium",
"domain": "translation",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "Summarize the main findings of the Human Genome Project",
"complexity": 0.5,
"tier": "medium",
"domain": "science",
"model": "gpt-4o-mini"
},
{
"query": "Write a villanelle about lost time",
"complexity": 0.62,
"tier": "hard",
"domain": "creative",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Implement a connection pool in Go",
"complexity": 0.71,
"tier": "hard",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Explain the concept of 'eventual consistency' in distributed systems",
"complexity": 0.65,
"tier": "hard",
"domain": "reasoning",
"model": "gpt-4o"
},
{
"query": "Derive the Black-Scholes equation for option pricing",
"complexity": 0.85,
"tier": "expert",
"domain": "math",
"model": "gpt-4o"
},
{
"query": "Design a distributed consensus protocol like Raft",
"complexity": 0.88,
"tier": "expert",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Explain the holographic principle in theoretical physics",
"complexity": 0.92,
"tier": "expert",
"domain": "science",
"model": "deepseek-chat"
},
{
"query": "Write a full compiler frontend for a small language in Rust",
"complexity": 0.95,
"tier": "expert",
"domain": "code",
"model": "gemini-1.5-pro"
},
{
"query": "Prove the Riemann Hypothesis (outline the main approach)",
"complexity": 0.99,
"tier": "expert",
"domain": "math",
"model": "gpt-4o"
},
{
"query": "Analyze the security of the TLS 1.3 handshake",
"complexity": 0.82,
"tier": "expert",
"domain": "reasoning",
"model": "llama3.1:70b"
},
{
"query": "Implement a B+ tree index from scratch",
"complexity": 0.87,
"tier": "expert",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Translate a complex patent document to Chinese",
"complexity": 0.76,
"tier": "hard",
"domain": "translation",
"model": "gpt-4o"
},
{
"query": "What is the difference between Bayesian and frequentist statistics?",
"complexity": 0.67,
"tier": "hard",
"domain": "math",
"model": "deepseek-chat"
},
{
"query": "Write a high-performance WebSocket server in C++",
"complexity": 0.79,
"tier": "hard",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "Explain the many-worlds interpretation of quantum mechanics",
"complexity": 0.73,
"tier": "hard",
"domain": "science",
"model": "llama3.1:70b"
},
{
"query": "Design a URL shortening service like TinyURL (full design)",
"complexity": 0.69,
"tier": "hard",
"domain": "code",
"model": "gemini-1.5-pro"
},
{
"query": "Prove the central limit theorem",
"complexity": 0.84,
"tier": "expert",
"domain": "math",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Write a distributed task queue using Redis",
"complexity": 0.74,
"tier": "hard",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Explain the concept of 'transfer learning' in neural networks",
"complexity": 0.56,
"tier": "medium",
"domain": "science",
"model": "gpt-4o"
},
{
"query": "Solve the traveling salesman problem using dynamic programming",
"complexity": 0.77,
"tier": "hard",
"domain": "code",
"model": "llama3.1:70b"
},
{
"query": "Translate a software license agreement to Spanish",
"complexity": 0.58,
"tier": "hard",
"domain": "translation",
"model": "gpt-4o-mini"
},
{
"query": "Write a detailed critique of the OpenAI GPT-4 architecture",
"complexity": 0.7,
"tier": "hard",
"domain": "reasoning",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "What is the curse of dimensionality in machine learning?",
"complexity": 0.51,
"tier": "medium",
"domain": "science",
"model": "gemini-1.5-pro"
},
{
"query": "Fix this Python code: `def add(a,b): return a-b` – it should add, not subtract.",
"complexity": 0.11,
"tier": "easy",
"domain": "code",
"model": "gpt-3.5-turbo"
},
{
"query": "Write a Python one-liner to reverse a string.",
"complexity": 0.13,
"tier": "easy",
"domain": "code",
"model": "claude-3-haiku-20240307"
},
{
"query": "Why does this JavaScript code print 'undefined'? `var x; console.log(x);`",
"complexity": 0.09,
"tier": "trivial",
"domain": "code",
"model": "llama3.2:3b"
},
{
"query": "Implement a function `is_palindrome(s)` in Python that ignores spaces and case.",
"complexity": 0.32,
"tier": "medium",
"domain": "code",
"model": "gemini-1.5-flash"
},
{
"query": "Debug this SQL: `SELECT * FORM users WHERE name = 'John';`",
"complexity": 0.07,
"tier": "trivial",
"domain": "code",
"model": "mistral-small-latest"
},
{
"query": "Write a recursive function to compute the nth Fibonacci number in Java.",
"complexity": 0.34,
"tier": "medium",
"domain": "code",
"model": "gpt-4o-mini"
},
{
"query": "What is the output of `console.log(1 + '2' + 3)` in JavaScript? Explain.",
"complexity": 0.15,
"tier": "easy",
"domain": "code",
"model": "llama3.1:8b"
},
{
"query": "Write a C function to swap two integers using pointers.",
"complexity": 0.28,
"tier": "easy",
"domain": "code",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "Fix the memory leak in this C++ snippet: `int* p = new int; p = new int; delete p;`",
"complexity": 0.45,
"tier": "medium",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Implement a queue using two stacks in Python.",
"complexity": 0.52,
"tier": "medium",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "Write a regex to extract all email addresses from a text.",
"complexity": 0.38,
"tier": "medium",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Why does this infinite loop happen? `for i in range(10): i -= 1`",
"complexity": 0.21,
"tier": "easy",
"domain": "code",
"model": "gemini-1.5-pro"
},
{
"query": "Write a Python decorator that caches return values of a function.",
"complexity": 0.58,
"tier": "hard",
"domain": "code",
"model": "llama3.1:70b"
},
{
"query": "Convert this list comprehension to a for loop: `[x**2 for x in range(10) if x%2==0]`",
"complexity": 0.19,
"tier": "easy",
"domain": "code",
"model": "gpt-3.5-turbo"
},
{
"query": "Write a SQL query to find employees who earn more than their managers.",
"complexity": 0.44,
"tier": "medium",
"domain": "code",
"model": "mistral-large-latest"
},
{
"query": "Implement a binary search in a sorted array (any language).",
"complexity": 0.36,
"tier": "medium",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Debug this Python: `print('Hello' + 123)` – what error and how to fix?",
"complexity": 0.1,
"tier": "trivial",
"domain": "code",
"model": "llama3.2:3b"
},
{
"query": "Write a function that merges two sorted lists into one sorted list (O(n)).",
"complexity": 0.41,
"tier": "medium",
"domain": "code",
"model": "gpt-4o-mini"
},
{
"query": "Explain why `[1,2,3].map(parseInt)` returns `[1, NaN, NaN]` in JavaScript.",
"complexity": 0.47,
"tier": "medium",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Write a simple HTML page that fetches data from a REST API and displays it.",
"complexity": 0.39,
"tier": "medium",
"domain": "code",
"model": "gemini-1.5-pro"
},
{
"query": "Implement a singleton pattern in Python.",
"complexity": 0.35,
"tier": "medium",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "Fix the race condition in this multi‑threaded Python code (pseudo).",
"complexity": 0.63,
"tier": "hard",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Write a recursive descent parser for simple arithmetic expressions (+, -, *, /).",
"complexity": 0.71,
"tier": "hard",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Why does this C code crash? `int arr[5]; arr[10] = 42;`",
"complexity": 0.08,
"tier": "trivial",
"domain": "code",
"model": "gpt-3.5-turbo"
},
{
"query": "Write a Python generator that yields the Fibonacci sequence infinitely.",
"complexity": 0.33,
"tier": "medium",
"domain": "code",
"model": "llama3.1:8b"
},
{
"query": "Implement an LRU cache using `OrderedDict` in Python.",
"complexity": 0.59,
"tier": "hard",
"domain": "code",
"model": "gemini-1.5-pro"
},
{
"query": "What does `*args` and `**kwargs` do in Python? Give an example.",
"complexity": 0.25,
"tier": "easy",
"domain": "code",
"model": "mistral-small-latest"
},
{
"query": "Write a JavaScript function that throttles another function (limit calls per second).",
"complexity": 0.55,
"tier": "medium",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "Debug this SQL injection vulnerability: `\"SELECT * FROM users WHERE id = \" + user_id`",
"complexity": 0.3,
"tier": "easy",
"domain": "code",
"model": "claude-3-haiku-20240307"
},
{
"query": "Implement a simple HTTP server in Python using `sockets`.",
"complexity": 0.62,
"tier": "hard",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Explain the output: `console.log([] + []); console.log([] + {}); console.log({} + []);`",
"complexity": 0.49,
"tier": "medium",
"domain": "code",
"model": "llama3.1:70b"
},
{
"query": "Write a C++ program that reverses a linked list.",
"complexity": 0.46,
"tier": "medium",
"domain": "code",
"model": "gpt-4o-mini"
},
{
"query": "Convert this `try/except` to using `contextlib.suppress` in Python.",
"complexity": 0.27,
"tier": "easy",
"domain": "code",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "Implement the Sieve of Eratosthenes in Java.",
"complexity": 0.42,
"tier": "medium",
"domain": "code",
"model": "gemini-1.5-flash"
},
{
"query": "Why does `0.1 + 0.2 !== 0.3` in JavaScript? Explain floating point.",
"complexity": 0.35,
"tier": "medium",
"domain": "code",
"model": "mistral-large-latest"
},
{
"query": "Write a Python script to find duplicate files in a directory (by hash).",
"complexity": 0.51,
"tier": "medium",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Fix the deadlock in this pseudocode: two threads lock A then B, and B then A.",
"complexity": 0.66,
"tier": "hard",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "Implement a simple event emitter in JavaScript (Node.js style).",
"complexity": 0.48,
"tier": "medium",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "What is tail recursion? Convert this factorial to tail‑recursive: `def fact(n): return 1 if n==0 else n*fact(n-1)`",
"complexity": 0.37,
"tier": "medium",
"domain": "code",
"model": "llama3.1:8b"
},
{
"query": "Write a Go routine that computes the sum of squares concurrently.",
"complexity": 0.54,
"tier": "medium",
"domain": "code",
"model": "gpt-4o-mini"
},
{
"query": "Translate 'The server is down' to Arabic",
"complexity": 0.14,
"tier": "easy",
"domain": "translation",
"model": "gemini-1.5-flash"
},
{
"query": "Summarize the concept of 'reference counting' in memory management.",
"complexity": 0.28,
"tier": "easy",
"domain": "summarization",
"model": "claude-3-haiku-20240307"
},
{
"query": "Solve `∫ x e^x dx`",
"complexity": 0.43,
"tier": "medium",
"domain": "math",
"model": "deepseek-chat"
},
{
"query": "Explain why black holes evaporate (Hawking radiation).",
"complexity": 0.61,
"tier": "hard",
"domain": "science",
"model": "gpt-4o"
},
{
"query": "Write a haiku about a segfault",
"complexity": 0.22,
"tier": "easy",
"domain": "creative",
"model": "llama3.2:3b"
},
{
"query": "What is the difference between `malloc` and `calloc` in C?",
"complexity": 0.17,
"tier": "easy",
"domain": "factual",
"model": "gpt-3.5-turbo"
},
{
"query": "Write a Python script to fetch JSON from an API and pretty‑print it.",
"complexity": 0.24,
"tier": "easy",
"domain": "code",
"model": "mistral-small-latest"
},
{
"query": "Debug this React hook: `useEffect(() => { setCount(count+1) }, [])` – why infinite loop?",
"complexity": 0.4,
"tier": "medium",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Implement a deep copy function for nested dictionaries in Python.",
"complexity": 0.39,
"tier": "medium",
"domain": "code",
"model": "gemini-1.5-pro"
},
{
"query": "Explain the `volatile` keyword in Java.",
"complexity": 0.44,
"tier": "medium",
"domain": "code",
"model": "gpt-4o-mini"
},
{
"query": "Write a SQL query to delete duplicate rows keeping one copy.",
"complexity": 0.41,
"tier": "medium",
"domain": "code",
"model": "llama3.1:70b"
},
{
"query": "Why does this Python code raise `UnboundLocalError`? `x = 10; def foo(): print(x); x=5`",
"complexity": 0.26,
"tier": "easy",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Implement a simple key‑value store with TTL (time‑to‑live) in Python.",
"complexity": 0.57,
"tier": "hard",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "Translate 'The warranty is void if seal is broken' to Mandarin.",
"complexity": 0.36,
"tier": "medium",
"domain": "translation",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Summarize the paper 'Attention is All You Need' in 5 bullet points.",
"complexity": 0.49,
"tier": "medium",
"domain": "summarization",
"model": "gemini-1.5-pro"
},
{
"query": "Solve `det([[1,2],[3,4]])` (determinant).",
"complexity": 0.18,
"tier": "easy",
"domain": "math",
"model": "llama3.1:8b"
},
{
"query": "Explain the chemical process of rusting.",
"complexity": 0.23,
"tier": "easy",
"domain": "science",
"model": "gpt-3.5-turbo"
},
{
"query": "Write a limerick about a null pointer",
"complexity": 0.29,
"tier": "easy",
"domain": "creative",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "What is a JIT compiler? Give an example runtime.",
"complexity": 0.34,
"tier": "medium",
"domain": "factual",
"model": "mistral-large-latest"
},
{
"query": "Write a C# method that reads a CSV file and returns a list of objects.",
"complexity": 0.42,
"tier": "medium",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Fix the JSON syntax error: `{name: 'John', age: 30}`",
"complexity": 0.06,
"tier": "trivial",
"domain": "code",
"model": "llama3.2:3b"
},
{
"query": "Implement a rate limiter using the token bucket algorithm in Python.",
"complexity": 0.65,
"tier": "hard",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "Explain the output `(0 == '0')` vs `(0 === '0')` in JavaScript.",
"complexity": 0.16,
"tier": "easy",
"domain": "code",
"model": "gpt-4o-mini"
},
{
"query": "Write a Bash script to find all `.log` files older than 7 days and compress them.",
"complexity": 0.38,
"tier": "medium",
"domain": "code",
"model": "gemini-1.5-flash"
},
{
"query": "Debug this Python multiprocessing code that hangs: `p = Pool(); p.map(f, range(10)); p.close()` (missing join).",
"complexity": 0.33,
"tier": "medium",
"domain": "code",
"model": "claude-3-haiku-20240307"
},
{
"query": "Write a regular expression to match a valid IPv4 address.",
"complexity": 0.48,
"tier": "medium",
"domain": "code",
"model": "llama3.1:70b"
},
{
"query": "Translate 'Please sign here' to Russian.",
"complexity": 0.11,
"tier": "easy",
"domain": "translation",
"model": "mistral-small-latest"
},
{
"query": "Summarize the concept of 'copy‑on‑write' in operating systems.",
"complexity": 0.37,
"tier": "medium",
"domain": "summarization",
"model": "deepseek-chat"
},
{
"query": "Solve `dy/dx = y` with initial condition y(0)=1.",
"complexity": 0.3,
"tier": "medium",
"domain": "math",
"model": "gpt-4o"
},
{
"query": "Explain the Doppler effect with an example.",
"complexity": 0.27,
"tier": "easy",
"domain": "science",
"model": "gemini-1.5-pro"
},
{
"query": "Write a tanka (5 lines) about a broken build pipeline.",
"complexity": 0.35,
"tier": "medium",
"domain": "creative",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "What is the difference between `INNER JOIN` and `LEFT JOIN`?",
"complexity": 0.21,
"tier": "easy",
"domain": "factual",
"model": "gpt-3.5-turbo"
},
{
"query": "Write a Python script that watches a directory for new files and processes them.",
"complexity": 0.56,
"tier": "medium",
"domain": "code",
"model": "llama3.1:8b"
},
{
"query": "Fix the off‑by‑one error: `for i in range(1, len(arr)): if arr[i] > arr[i-1]:` – correct.",
"complexity": 0.12,
"tier": "easy",
"domain": "code",
"model": "gpt-4o-mini"
},
{
"query": "Implement a Bloom filter in Python (simple version).",
"complexity": 0.6,
"tier": "hard",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Explain why `'5' - 3` works but `'5' + 3` gives different results in JavaScript.",
"complexity": 0.31,
"tier": "medium",
"domain": "code",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "Write a Golang function that reads a file line by line.",
"complexity": 0.26,
"tier": "easy",
"domain": "code",
"model": "gemini-1.5-flash"
},
{
"query": "Translate 'This is a confidential document' to German.",
"complexity": 0.2,
"tier": "easy",
"domain": "translation",
"model": "mistral-large-latest"
},
{
"query": "Summarize the key differences between TCP and UDP.",
"complexity": 0.24,
"tier": "easy",
"domain": "summarization",
"model": "gpt-4o"
},
{
"query": "Solve the eigenvalue problem for matrix `[[2, 1], [1, 2]]`.",
"complexity": 0.53,
"tier": "medium",
"domain": "math",
"model": "llama3.1:70b"
},
{
"query": "Explain the double‑slit experiment in quantum mechanics.",
"complexity": 0.58,
"tier": "hard",
"domain": "science",
"model": "deepseek-chat"
},
{
"query": "Write a sonnet about a race condition (14 lines).",
"complexity": 0.63,
"tier": "hard",
"domain": "creative",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "What is the purpose of `__slots__` in Python?",
"complexity": 0.41,
"tier": "medium",
"domain": "factual",
"model": "gpt-4o-mini"
},
{
"query": "Write a Rust function that takes a string and returns the first word.",
"complexity": 0.32,
"tier": "medium",
"domain": "code",
"model": "gemini-1.5-pro"
},
{
"query": "Fix the SQL injection in this PHP code: `$query = \"SELECT * FROM users WHERE id = $_GET[id]\";`",
"complexity": 0.29,
"tier": "easy",
"domain": "code",
"model": "gpt-3.5-turbo"
},
{
"query": "Implement a priority queue using a binary heap in Java.",
"complexity": 0.55,
"tier": "medium",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Why does `a = []; a.append(a)` cause infinite recursion when printed? Explain.",
"complexity": 0.34,
"tier": "medium",
"domain": "code",
"model": "llama3.1:8b"
},
{
"query": "Write a JavaScript function that deep freezes an object.",
"complexity": 0.46,
"tier": "medium",
"domain": "code",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Translate 'Temperature exceeds safe limit' to Japanese.",
"complexity": 0.25,
"tier": "easy",
"domain": "translation",
"model": "gpt-4o"
},
{
"query": "Summarize the plot of 'The Metamorphosis' by Kafka.",
"complexity": 0.33,
"tier": "medium",
"domain": "summarization",
"model": "gemini-1.5-flash"
},
{
"query": "Solve `lim x→0 (sin x)/x`.",
"complexity": 0.22,
"tier": "easy",
"domain": "math",
"model": "mistral-small-latest"
},
{
"query": "Explain why the sky appears blue (Rayleigh scattering).",
"complexity": 0.28,
"tier": "easy",
"domain": "science",
"model": "claude-3-haiku-20240307"
},
{
"query": "Write a seven‑line poem about a memory leak.",
"complexity": 0.38,
"tier": "medium",
"domain": "creative",
"model": "llama3.2:3b"
},
{
"query": "What is the difference between a thread and a coroutine?",
"complexity": 0.43,
"tier": "medium",
"domain": "factual",
"model": "gpt-4o-mini"
},
{
"query": "Write a Python script that converts a CSV to JSON.",
"complexity": 0.31,
"tier": "medium",
"domain": "code",
"model": "deepseek-chat"
},
{
"query": "Fix the race condition in this Python async code: `async def f(): global x; x+=1` (use lock).",
"complexity": 0.51,
"tier": "medium",
"domain": "code",
"model": "gpt-4o"
},
{
"query": "Translate 'The quick brown fox jumps over the lazy dog' to Spanish.",
"complexity": 0.12,
"tier": "easy",
"domain": "translation",
"model": "gpt-3.5-turbo"
},
{
"query": "Paraphrase this sentence: 'Despite the rain, the event was a huge success.'",
"complexity": 0.18,
"tier": "easy",
"domain": "translation",
"model": "claude-3-haiku-20240307"
},
{
"query": "Translate 'Where is the nearest metro station?' to French.",
"complexity": 0.1,
"tier": "trivial",
"domain": "translation",
"model": "llama3.2:3b"
},
{
"query": "Correct the grammar: 'He don't know nothing about that.'",
"complexity": 0.09,
"tier": "trivial",
"domain": "translation",
"model": "gemini-1.5-flash"
},
{
"query": "Translate 'I would like to order a vegetarian pizza' to Italian.",
"complexity": 0.14,
"tier": "easy",
"domain": "translation",
"model": "mistral-small-latest"
},
{
"query": "Rewrite this in formal English: 'Hey, can you send me the doc ASAP?'",
"complexity": 0.16,
"tier": "easy",
"domain": "translation",
"model": "gpt-4o-mini"
},
{
"query": "Translate 'The system is under maintenance' to German.",
"complexity": 0.11,
"tier": "easy",
"domain": "translation",
"model": "llama3.1:8b"
},
{
"query": "Convert this passive voice to active: 'The report was written by John.'",
"complexity": 0.08,
"tier": "trivial",
"domain": "translation",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "Translate 'What is your name?' to Mandarin Chinese (pinyin).",
"complexity": 0.13,
"tier": "easy",
"domain": "translation",
"model": "deepseek-chat"
},
{
"query": "Paraphrase the idiom 'It's raining cats and dogs' into plain English.",
"complexity": 0.15,
"tier": "easy",
"domain": "translation",
"model": "gpt-4o"
},
{
"query": "Translate 'Please call back later' to Japanese.",
"complexity": 0.15,
"tier": "easy",
"domain": "translation",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Change this sentence to past tense: 'I go to the gym every day.'",
"complexity": 0.06,
"tier": "trivial",
"domain": "translation",
"model": "gemini-1.5-pro"
},
{
"query": "Translate 'The price does not include tax' to Portuguese.",
"complexity": 0.12,
"tier": "easy",
"domain": "translation",
"model": "mistral-large-latest"
},
{
"query": "Summarize this paragraph in 10 words: 'Machine learning is a subset of artificial intelligence that enables systems to learn from data.'",
"complexity": 0.19,
"tier": "easy",
"domain": "summarization",
"model": "llama3.1:70b"
},
{
"query": "Translate 'I have a meeting at 3 PM' to Russian.",
"complexity": 0.14,
"tier": "easy",
"domain": "translation",
"model": "gpt-3.5-turbo"
},
{
"query": "Explain the difference between 'affect' and 'effect' with examples.",
"complexity": 0.17,
"tier": "easy",
"domain": "factual",
"model": "claude-3-haiku-20240307"
},
{
"query": "Translate 'Your session has expired' to Arabic.",
"complexity": 0.16,
"tier": "easy",
"domain": "translation",
"model": "deepseek-chat"
},
{
"query": "Rewrite this sentence more concisely: 'Due to the fact that it was raining, we canceled the picnic.'",
"complexity": 0.11,
"tier": "easy",
"domain": "translation",
"model": "gemini-1.5-flash"
},
{
"query": "Translate 'Can you help me with this problem?' to Hindi (Romanized).",
"complexity": 0.18,
"tier": "easy",
"domain": "translation",
"model": "gpt-4o-mini"
},
{
"query": "Change this to a question: 'She knows the answer.'",
"complexity": 0.05,
"tier": "trivial",
"domain": "translation",
"model": "llama3.2:3b"
},
{
"query": "Translate 'The file is corrupted' to Korean.",
"complexity": 0.15,
"tier": "easy",
"domain": "translation",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Paraphrase this technical sentence: 'Authentication via OAuth 2.0 provides delegated access.'",
"complexity": 0.34,
"tier": "medium",
"domain": "translation",
"model": "gpt-4o"
},
{
"query": "Translate a short poem from English to French (preserve rhyme).",
"complexity": 0.45,
"tier": "medium",
"domain": "translation",
"model": "mistral-large-latest"
},
{
"query": "Detect the language of this text: 'Bonjour, comment ça va?' and translate to English.",
"complexity": 0.2,
"tier": "easy",
"domain": "translation",
"model": "gemini-1.5-pro"
},
{
"query": "Write a grammatically correct sentence using 'their', 'there', and 'they're'.",
"complexity": 0.12,
"tier": "easy",
"domain": "creative",
"model": "llama3.1:8b"
},
{
"query": "Translate 'The application has encountered an unexpected error' to German.",
"complexity": 0.22,
"tier": "easy",
"domain": "translation",
"model": "gpt-3.5-turbo"
},
{
"query": "Rewrite this in the imperative mood: 'You should read the instructions carefully.'",
"complexity": 0.09,
"tier": "trivial",
"domain": "translation",
"model": "claude-3-haiku-20240307"
},
{
"query": "Translate 'I apologize for the inconvenience' to Spanish.",
"complexity": 0.13,
"tier": "easy",
"domain": "translation",
"model": "mistral-small-latest"
},
{
"query": "Convert this direct speech to indirect: He said he would come tomorrow.",
"complexity": 0.16,
"tier": "easy",
"domain": "translation",
"model": "deepseek-chat"
},
{
"query": "Translate 'Please proceed to gate B12' to Japanese.",
"complexity": 0.17,
"tier": "easy",
"domain": "translation",
"model": "gpt-4o"
},
{
"query": "Simplify this legalese: 'The party of the first part shall indemnify the party of the second part.'",
"complexity": 0.41,
"tier": "medium",
"domain": "translation",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Translate 'The deadline is Friday at 5 PM' to Italian.",
"complexity": 0.14,
"tier": "easy",
"domain": "translation",
"model": "gemini-1.5-flash"
},
{
"query": "Explain what a 'malapropism' is and give an example.",
"complexity": 0.26,
"tier": "easy",
"domain": "factual",
"model": "llama3.1:70b"
},
{
"query": "Translate a business email subject: 'Q3 Financial Results Attached' to French.",
"complexity": 0.18,
"tier": "easy",
"domain": "translation",
"model": "gpt-4o-mini"
},
{
"query": "Change this to future perfect tense: 'I finish the project.'",
"complexity": 0.1,
"tier": "trivial",
"domain": "translation",
"model": "llama3.2:3b"
},
{
"query": "Translate 'The server will reboot in 5 minutes' to Portuguese.",
"complexity": 0.15,
"tier": "easy",
"domain": "translation",
"model": "mistral-large-latest"
},
{
"query": "Paraphrase this scientific abstract (2 sentences) for a general audience.",
"complexity": 0.39,
"tier": "medium",
"domain": "summarization",
"model": "deepseek-chat"
},
{
"query": "Translate 'Your payment was successful' to Russian.",
"complexity": 0.13,
"tier": "easy",
"domain": "translation",
"model": "gpt-3.5-turbo"
},
{
"query": "Rewrite this sentence in the negative form: 'Everyone attended the meeting.'",
"complexity": 0.07,
"tier": "trivial",
"domain": "translation",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "Translate 'Please do not touch the glass' to Mandarin.",
"complexity": 0.14,
"tier": "easy",
"domain": "translation",
"model": "gemini-1.5-pro"
},
{
"query": "Correct the spelling: 'recieve', 'seperate', 'definately'",
"complexity": 0.06,
"tier": "trivial",
"domain": "translation",
"model": "llama3.1:8b"
},
{
"query": "Translate 'The operation was completed successfully' to Arabic.",
"complexity": 0.18,
"tier": "easy",
"domain": "translation",
"model": "gpt-4o"
},
{
"query": "Convert this bullet list into a coherent paragraph.",
"complexity": 0.28,
"tier": "easy",
"domain": "summarization",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Translate 'What time does the store close?' to German.",
"complexity": 0.11,
"tier": "easy",
"domain": "translation",
"model": "mistral-small-latest"
},
{
"query": "Explain the difference between 'who' and 'whom' with examples.",
"complexity": 0.22,
"tier": "easy",
"domain": "factual",
"model": "deepseek-chat"
},
{
"query": "Translate 'This feature is not yet implemented' to Spanish.",
"complexity": 0.16,
"tier": "easy",
"domain": "translation",
"model": "gpt-4o-mini"
},
{
"query": "Rewrite this sentence using a simile: 'Her voice was loud.'",
"complexity": 0.2,
"tier": "easy",
"domain": "creative",
"model": "gemini-1.5-flash"
},
{
"query": "Translate 'Please verify your email address' to Japanese.",
"complexity": 0.17,
"tier": "easy",
"domain": "translation",
"model": "llama3.2:3b"
},
{
"query": "Change this from first person to third person: 'I think this solution is optimal.'",
"complexity": 0.15,
"tier": "easy",
"domain": "translation",
"model": "gpt-3.5-turbo"
},
{
"query": "Translate a chat message: 'BRB, gonna grab coffee' to formal English.",
"complexity": 0.12,
"tier": "easy",
"domain": "translation",
"model": "claude-3-haiku-20240307"
},
{
"query": "Paraphrase 'The new update includes several security patches' without changing meaning.",
"complexity": 0.19,
"tier": "easy",
"domain": "translation",
"model": "mistral-large-latest"
},
{
"query": "Translate 'The connection has timed out' to Italian.",
"complexity": 0.15,
"tier": "easy",
"domain": "translation",
"model": "gpt-4o"
},
{
"query": "Write a haiku about the translator's dilemma.",
"complexity": 0.31,
"tier": "medium",
"domain": "creative",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Translate 'Access denied' to French.",
"complexity": 0.06,
"tier": "trivial",
"domain": "translation",
"model": "gemini-1.5-pro"
},
{
"query": "Explain the concept of 'cognates' in linguistics with examples.",
"complexity": 0.35,
"tier": "medium",
"domain": "science",
"model": "deepseek-chat"
},
{
"query": "Translate a short warning: 'High voltage, risk of electric shock' to Spanish.",
"complexity": 0.18,
"tier": "easy",
"domain": "translation",
"model": "llama3.1:70b"
},
{
"query": "Rewrite this in colloquial English: 'I am extremely fatigued.'",
"complexity": 0.1,
"tier": "trivial",
"domain": "translation",
"model": "gpt-4o-mini"
},
{
"query": "Translate 'The package will arrive within 2 business days' to German.",
"complexity": 0.19,
"tier": "easy",
"domain": "translation",
"model": "mistral-small-latest"
},
{
"query": "Change this sentence to exclamatory: 'It is a beautiful day.'",
"complexity": 0.05,
"tier": "trivial",
"domain": "translation",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "Translate 'Please enter your password' to Korean.",
"complexity": 0.13,
"tier": "easy",
"domain": "translation",
"model": "gpt-3.5-turbo"
},
{
"query": "Summarize the difference between British and American English spelling (5 examples).",
"complexity": 0.27,
"tier": "easy",
"domain": "summarization",
"model": "gemini-1.5-flash"
},
{
"query": "Translate 'I don't understand this instruction' to Portuguese.",
"complexity": 0.14,
"tier": "easy",
"domain": "translation",
"model": "llama3.1:8b"
},
{
"query": "Paraphrase this corporate jargon: 'We'll circle back on that action item.'",
"complexity": 0.22,
"tier": "easy",
"domain": "translation",
"model": "gpt-4o"
},
{
"query": "Translate 'Your account has been locked' to Arabic.",
"complexity": 0.18,
"tier": "easy",
"domain": "translation",
"model": "deepseek-chat"
},
{
"query": "Write a sentence using the word 'ubiquitous' correctly.",
"complexity": 0.12,
"tier": "easy",
"domain": "creative",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Translate 'The meeting was rescheduled to Monday' to Italian.",
"complexity": 0.16,
"tier": "easy",
"domain": "translation",
"model": "mistral-large-latest"
},
{
"query": "Change this from active to passive: 'The chef cooked a delicious meal.'",
"complexity": 0.08,
"tier": "trivial",
"domain": "translation",
"model": "gpt-4o-mini"
},
{
"query": "Translate 'Please wait while we process your request' to Japanese.",
"complexity": 0.2,
"tier": "easy",
"domain": "translation",
"model": "gemini-1.5-pro"
},
{
"query": "Explain the term 'portmanteau' and give three examples.",
"complexity": 0.25,
"tier": "easy",
"domain": "factual",
"model": "llama3.2:3b"
},
{
"query": "Translate a legal disclaimer: 'Not responsible for lost or stolen items' to French.",
"complexity": 0.33,
"tier": "medium",
"domain": "translation",
"model": "gpt-3.5-turbo"
},
{
"query": "Rewrite this sentence without using the word 'very': 'She was very tired.'",
"complexity": 0.09,
"tier": "trivial",
"domain": "translation",
"model": "claude-3-haiku-20240307"
},
{
"query": "Translate 'Your session will expire in 10 minutes' to Russian.",
"complexity": 0.17,
"tier": "easy",
"domain": "translation",
"model": "deepseek-chat"
},
{
"query": "Convert this to a rhetorical question: 'You should know better.'",
"complexity": 0.11,
"tier": "easy",
"domain": "translation",
"model": "gpt-4o"
},
{
"query": "Translate 'The file size exceeds the limit' to Spanish.",
"complexity": 0.14,
"tier": "easy",
"domain": "translation",
"model": "mistral-small-latest"
},
{
"query": "Summarize the plot of 'The Tower of Babel' story in two sentences.",
"complexity": 0.25,
"tier": "easy",
"domain": "summarization",
"model": "gemini-1.5-flash"
},
{
"query": "Translate 'Please accept our sincere apologies' to German.",
"complexity": 0.16,
"tier": "easy",
"domain": "translation",
"model": "llama3.1:70b"
},
{
"query": "Paraphrase this proverb: 'A bird in the hand is worth two in the bush.'",
"complexity": 0.2,
"tier": "easy",
"domain": "translation",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Translate 'The system will restart automatically' to Mandarin.",
"complexity": 0.18,
"tier": "easy",
"domain": "translation",
"model": "gpt-4o-mini"
},
{
"query": "Fix the subject-verb agreement: 'The list of items are on the table.'",
"complexity": 0.07,
"tier": "trivial",
"domain": "translation",
"model": "llama3.2:3b"
},
{
"query": "Translate 'I've attached the document for your review' to Italian.",
"complexity": 0.17,
"tier": "easy",
"domain": "translation",
"model": "gpt-3.5-turbo"
},
{
"query": "Explain the difference between denotation and connotation with examples.",
"complexity": 0.29,
"tier": "easy",
"domain": "factual",
"model": "gemini-1.5-pro"
},
{
"query": "Translate 'Your request has been received' to Korean.",
"complexity": 0.14,
"tier": "easy",
"domain": "translation",
"model": "mistral-large-latest"
},
{
"query": "Rewrite this sentence using alliteration: 'The dog ran fast.'",
"complexity": 0.21,
"tier": "easy",
"domain": "creative",
"model": "deepseek-chat"
},
{
"query": "Translate 'The store is closed on Sundays' to Portuguese.",
"complexity": 0.13,
"tier": "easy",
"domain": "translation",
"model": "claude-3-5-haiku-20241022"
},
{
"query": "Change this from singular to plural: 'The child is playing.'",
"complexity": 0.04,
"tier": "trivial",
"domain": "translation",
"model": "gpt-4o"
},
{
"query": "Translate 'Please note that prices are subject to change' to French.",
"complexity": 0.24,
"tier": "easy",
"domain": "translation",
"model": "llama3.1:8b"
},
{
"query": "Paraphrase this headline: 'Tech Giant Announces Record Profits Amid Layoffs'",
"complexity": 0.26,
"tier": "easy",
"domain": "summarization",
"model": "gpt-4o-mini"
},
{
"query": "Translate 'The shipment is delayed due to weather' to German.",
"complexity": 0.19,
"tier": "easy",
"domain": "translation",
"model": "mistral-small-latest"
},
{
"query": "Write a sentence that is grammatically correct but semantically nonsensical.",
"complexity": 0.23,
"tier": "easy",
"domain": "creative",
"model": "claude-3-haiku-20240307"
},
{
"query": "Translate 'Your feedback is valuable to us' to Japanese.",
"complexity": 0.16,
"tier": "easy",
"domain": "translation",
"model": "gemini-1.5-flash"
},
{
"query": "Explain what a 'double negative' is and why it's often avoided in standard English.",
"complexity": 0.2,
"tier": "easy",
"domain": "factual",
"model": "deepseek-chat"
},
{
"query": "Translate 'The server is experiencing high load' to Arabic.",
"complexity": 0.21,
"tier": "easy",
"domain": "translation",
"model": "gpt-4o"
},
{
"query": "Rewrite this sentence as a conditional: 'You didn't water the plant, so it died.'",
"complexity": 0.14,
"tier": "easy",
"domain": "translation",
"model": "llama3.1:70b"
},
{
"query": "Translate 'Congratulations on your promotion' to Spanish.",
"complexity": 0.11,
"tier": "easy",
"domain": "translation",
"model": "claude-3-5-sonnet-20241022"
},
{
"query": "Summarize the concept of 'code-switching' in linguistics in one sentence.",
"complexity": 0.28,
"tier": "easy",
"domain": "science",
"model": "gpt-4o-mini"
},
{
"query": "Translate 'Please do not disturb' to Italian.",
"complexity": 0.09,
"tier": "trivial",
"domain": "translation",
"model": "gemini-1.5-pro"
},
{
"query": "Correct this sentence so that it uses the subjunctive mood: 'I wish I was there.'",
"complexity": 0.15,
"tier": "easy",
"domain": "translation",
"model": "mistral-large-latest"
}
]