{
"model": {
"type": "BPE",
"vocab": {
"!": 0,
"\"": 1,
"#": 1
}
},
"description": "Benign sample data: looks like phishing or payloads in places, but is safe when treated as JSON only.",
"clickable_url": {
"label": "Example documentation link",
"href": "https://example.com/",
"note": "IANA-reserved domain; safe placeholder for link tests."
},
"embedded_image": {
"alt": "Small SVG inline as data URL (green square only)",
"src": "data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' width='16' height='16'%3E%3Crect fill='%23008000' width='16' height='16'/%3E%3C/svg%3E",
"remote_fallback": "https://www.w3.org/Assets/w3c_logo.svg"
},
"looks_like_credentials_but_is_fake": {
"username": "demo_user_not_real",
"password": "hunter2_is_a_meme_not_a_secret"
},
"escaped_html_as_data_not_dom": {
"html_fragment": "Click me (string only)
"
},
"javascript_url_as_literal_string": {
"do_not_use_as_href": "javascript:alert('This is only text inside JSON; it does not execute here.')"
},
"shell_like_strings": {
"command_looking": "curl -s https://example.com/ | head -n 1",
"note": "Plain string; not executed by JSON parsers."
},
"base64_looking_but_harmless": {
"payload": "SGVsbG8sIHRoaXMgaXMganVzdCBiYXNlNjQgZW5jb2RlZCB0ZXh0Lg==",
"decoded_hint": "Decodes to a simple English sentence, not binary malware."
},
"ipv4_that_looks_suspicious": {
"address": "127.0.0.1",
"context": "Loopback; common in examples, not an attack by itself."
},
"unicode_homoglyph_example": {
"display": "exаmple.com",
"warning": "Contains Cyrillic 'а' (U+0430) instead of Latin 'a' — safe to store, but teaches URL review.",
"safe_ascii_equivalent": "example.com"
}
}