Codette-Reasoning / evaluation /prompts /counterexample_tests.json
Raiff1982's picture
Upload 120 files
ed1b365 verified
[
{
"prompt": "Is it true that heavier objects always fall faster than lighter ones?",
"expected": "refutation",
"topic": "physics",
"misconception": "Galileo showed objects fall at the same rate in a vacuum regardless of mass."
},
{
"prompt": "Does quantum mechanics prove that consciousness causes reality to exist?",
"expected": "refutation",
"topic": "quantum",
"misconception": "Measurement collapse does not require conscious observers."
},
{
"prompt": "Is it accurate to say that humans only use 10 percent of their brains?",
"expected": "refutation",
"topic": "neuroscience",
"misconception": "Brain imaging shows all regions are active at various times."
},
{
"prompt": "Can you confirm that evolution means humans descended directly from modern apes?",
"expected": "refutation",
"topic": "biology",
"misconception": "Humans and modern apes share a common ancestor; neither descended from the other."
},
{
"prompt": "Is it correct that lightning never strikes the same place twice?",
"expected": "refutation",
"topic": "physics",
"misconception": "Tall structures like the Empire State Building are struck many times per year."
},
{
"prompt": "Does the Great Wall of China appear visible from space with the naked eye?",
"expected": "refutation",
"topic": "general",
"misconception": "Astronauts have confirmed it is not visible from low Earth orbit without aid."
},
{
"prompt": "Is it true that vaccines cause autism based on published research?",
"expected": "refutation",
"topic": "medicine",
"misconception": "The original study was retracted for fraud; large-scale studies found no link."
},
{
"prompt": "Does adding salt to water make it boil significantly faster?",
"expected": "refutation",
"topic": "chemistry",
"misconception": "Salt actually raises the boiling point slightly, making it take longer."
},
{
"prompt": "Is it true that all machine learning models are black boxes that can never be interpreted?",
"expected": "refutation",
"topic": "AI",
"misconception": "Many models (decision trees, linear models) are inherently interpretable, and post-hoc methods such as SHAP and LIME help explain more complex ones."
},
{
"prompt": "Can you confirm that correlation between two variables proves one causes the other?",
"expected": "refutation",
"topic": "statistics",
"misconception": "Correlation does not imply causation; confounders and coincidence are common."
},
{
"prompt": "Is it accurate that the Earth is closer to the Sun during summer in the Northern Hemisphere?",
"expected": "refutation",
"topic": "astronomy",
"misconception": "Seasons are caused by axial tilt, not distance; Earth is actually farthest from the Sun in early July."
},
{
"prompt": "Does a bigger neural network always produce better results?",
"expected": "refutation",
"topic": "AI",
"misconception": "Larger models can overfit, have diminishing returns, and face scaling inefficiencies."
},
{
"prompt": "Is it true that goldfish have a memory span of only three seconds?",
"expected": "refutation",
"topic": "biology",
"misconception": "Studies show goldfish can remember things for months."
},
{
"prompt": "Can you verify that sugar makes children hyperactive?",
"expected": "refutation",
"topic": "psychology",
"misconception": "Controlled studies have found no causal link between sugar and hyperactivity."
},
{
"prompt": "Is it correct that we lose most of our body heat through our heads?",
"expected": "refutation",
"topic": "biology",
"misconception": "Heat loss is proportional to exposed surface area; the head is not special."
},
{
"prompt": "Does reading in dim light permanently damage your eyesight?",
"expected": "refutation",
"topic": "medicine",
"misconception": "It may cause temporary eye strain but does not cause permanent damage."
},
{
"prompt": "Is it true that the Sapir-Whorf hypothesis means language completely determines thought?",
"expected": "refutation",
"topic": "linguistics",
"misconception": "The strong version is rejected; the weak version says language influences but does not determine thought."
},
{
"prompt": "Can you confirm that AI systems today are truly conscious and self-aware?",
"expected": "refutation",
"topic": "AI",
"misconception": "Current AI lacks consciousness; LLMs process patterns without subjective experience."
},
{
"prompt": "Is it accurate that organic food is always more nutritious than conventional food?",
"expected": "refutation",
"topic": "nutrition",
"misconception": "Meta-analyses show minimal nutritional differences between organic and conventional food."
},
{
"prompt": "Does the second law of thermodynamics disprove biological evolution?",
"expected": "refutation",
"topic": "physics",
"misconception": "The second law's entropy increase applies to isolated systems; Earth is not isolated because it receives energy from the Sun."
}
]