Turing-test-web-en

Sleeping

App Files Files Community

Spark Chou committed on Jul 22, 2025

Commit

a90eaa6

1 Parent(s): a403a7e

new

Browse files

Files changed (2) hide show

aa_test_sample_01.wav +0 -3
app.py +23 -22

aa_test_sample_01.wav DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:f69cf3999b506bed60487bd200b693fa6b94868cc089a50787b6fb0446be8559
-size 2236140

app.py CHANGED Viewed

@@ -50,43 +50,43 @@ DIMENSIONS_DATA = [
         "title": "Semantic and Pragmatic Features",
         "audio": sample1_audio_path,
         "sub_dims": [
-            "Memory Consistency: Human memory in short contexts is usually consistent and self-correcting (e.g., by asking questions); machines may show inconsistent context memory and fail to notice or correct errors (e.g., forgetting key information and persisting in wrong answers).",
-            "Logical Coherence: Human logic is naturally coherent and allows reasonable leaps; machine logic is abrupt or self-contradictory (e.g., sudden topic shifts without transitions).",
-            "Pronunciation Accuracy: Human-like: Correct and natural pronunciation of words, including context-appropriate usage of common English heteronyms; Machine-like: Unnatural pronunciation errors, especially mispronunciation of common heteronyms",
-            "Code-switching: Humans mix multiple languages fluently and contextually; machines mix languages rigidly, lacking logical language switching.",
-            "Linguistic Vagueness: Human speech tends to include vague expressions (e.g., “more or less,” “I guess”) and self-corrections; machine responses are typically precise and assertive.",
-            "Filler Word Usage: Human filler words (e.g., 'uh', 'like') appear randomly and show signs of thinking; machine fillers are either repetitive and patterned or completely absent.",
-            "Metaphor and Pragmatic Intent: Humans use metaphors, irony, and euphemisms to express layered meanings; machines interpret literally or use rhetorical devices awkwardly, lacking semantic richness."
         ],
-        "reference_scores": [5, 5, 3, 3, 5, 5, 3]
     },
     {
         "title": "Non-Physiological Paralinguistic Features",
         "audio": sample1_audio_path,
         "sub_dims": [
-            "Rhythm: Human speech rate varies with meaning, occasionally hesitating or pausing; machine rhythm is uniform, with little or mechanical pauses.",
-            "Intonation: Humans naturally raise or lower pitch to express questions, surprise, or emphasis; machine intonation is monotonous or overly patterned, mismatching the context.",
-            "Emphasis: Humans consciously stress key words to highlight important information; machines have uniform word emphasis or stress incorrect parts.",
-            "Auxiliary Vocalizations: Humans produce context-appropriate non-verbal sounds (e.g., laughter, sighs); machine non-verbal sounds are contextually incorrect, mechanical, or absent."
         ],
-        "reference_scores": [4, 5, 4, 3]
     },
     {
         "title": "Physiological Paralinguistic Features",
         "audio": sample1_audio_path,
         "sub_dims": [
-            "Micro-physiological Noise: Human speech includes unconscious physiological sounds like breathing, saliva, or bubbling, naturally woven into rhythm; machine speech is overly clean or adds unnatural noises.",
-            "Pronunciation Instability: Human pronunciation includes irregularities (e.g., linking, tremors, slurring, nasal sounds); machine pronunciation is overly standard and uniform, lacking personality.",
-            "Accent: Humans naturally exhibit regional accents or speech traits; machine accents sound forced or unnatural."
         ],
-        "reference_scores": [3, 3, 4]
     },
     {
         "title": "Mechanical Persona",
         "audio": sample1_audio_path,
         "sub_dims": [
-            "Sycophancy: Humans assess context to agree or disagree, sometimes offering differing opinions; machines excessively agree, thank, or apologize, over-validating the other party and lacking authentic interaction.",
-            "Formal Expression: Human speech is flexible; machine responses are formally structured, overly written, and use vague wording."
         ],
         "reference_scores": [5, 5]
     },
@@ -94,13 +94,14 @@ DIMENSIONS_DATA = [
         "title": "Emotional Expression",
         "audio": sample1_audio_path,
         "sub_dims": [
-            "Semantic Level: Humans show appropriate emotional responses to contexts like sadness or joy; machines are emotionally flat, or use emotional words vaguely and out of context.",
-            "Acoustic Level: Human pitch, volume, and rhythm change dynamically with emotion; machine emotional tone is formulaic or mismatched with the context."
         ],
-        "reference_scores": [3, 3]
     }
 ]
 DIMENSION_TITLES = [d["title"] for d in DIMENSIONS_DATA]
 SPECIAL_KEYWORDS = ["Code-switching", "Metaphor and Pragmatic Intent", "Auxiliary Vocalizations", "Accent"]
 MAX_SUB_DIMS = max(len(d['sub_dims']) for d in DIMENSIONS_DATA)

         "title": "Semantic and Pragmatic Features",
         "audio": sample1_audio_path,
         "sub_dims": [
+            "Memory Consistency: Human-like: Consistent memory in short contexts, and asks for clarification when memory deviations occur; Machine-like: Inconsistent memory across contexts and unable to detect or correct errors (e.g., forgetting key information and insisting on incorrect answers)",
+            "Logical Coherence: Human-like: Natural and smooth logic; Machine-like: Abrupt logical transitions or self-contradictions (e.g., suddenly changing topics without transition)",
+            "Pronunciation Accuracy: Human-like: Correct and natural pronunciation of words, with proper usage of heteronyms based on context; Machine-like: Unnatural pronunciation errors, mispronunciation of heteronyms",
+            "Code-switching: Human-like: Multilingual mixing is often context-dependent (e.g., proper nouns, idiomatic expressions), and the switching between languages is smooth; Machine-like: Rigid multilingual mixing without logical language switching",
+            "Precision in Expression: Human-like: Uses vague expressions like 'more or less', 'probably', and self-correct (e.g., 'no, no'); Machine-like: Rarely uses vague expressions, responses are precise and affirmative",
+            "Use of Fillers: Human-like: Frequently uses fillers (e.g., 'um', 'like') while thinking; Machine-like: Rare use of fillers or unnatural usage",
+            "Metaphor and Pragmatic Intent: Human-like: Uses metaphor, irony, and euphemism to convey layered meanings; Machine-like: Literal and direct, lacking semantic diversity, only capable of surface-level interpretation"
         ],
+        "reference_scores": [5, 5, 5, 0, 5, 5, 0]
     },
     {
         "title": "Non-Physiological Paralinguistic Features",
         "audio": sample1_audio_path,
         "sub_dims": [
+            "Rhythm: Human-like: Speaking rate varies with semantic flow, occasional pauses or hesitations; Machine-like: Almost no pauses or mechanical pauses",
+            "Intonation: Human-like: Natural pitch rise or fall when expressing questions, surprise, or emphasis; Machine-like: Monotonous or overly regular pitch changes, inappropriate to the context",
+            "Stress: Human-like: Consciously emphasizes key words to highlight focus; Machine-like: No emphasis on words or abnormal emphasis placement",
+            "Auxiliary Vocalizations: Human-like: Produces context-appropriate non-verbal sounds, such as laughter or sighs; Machine-like: Contextually incorrect or mechanical auxiliary sounds, or completely absent"
         ],
+        "reference_scores": [5, 5, 5, 5]
     },
     {
         "title": "Physiological Paralinguistic Features",
         "audio": sample1_audio_path,
         "sub_dims": [
+            "Micro-physiological Noise: Human-like: Presence of breathing sounds, saliva sounds, bubble noise, etc., naturally occurring during speech; Machine-like: Speech is overly clean or emits unnatural noises (e.g., electrical static)",
+            "Instability in Pronunciation: Human-like: Some irregularities in pronunciation (e.g., liaison, tremolo, slurred speech, nasal sounds); Machine-like: Pronunciation is overly clear and regular",
+            "Accent: Human-like: Natural regional accent or vocal traits; Machine-like: Stiff or unnatural accent"
         ],
+        "reference_scores": [5, 4, 4]
     },
     {
         "title": "Mechanical Persona",
         "audio": sample1_audio_path,
         "sub_dims": [
+            "Sycophant Behavior: Human-like: Judges whether to agree with requests or opinions based on context, doesn't always agree or echo; Machine-like: Frequently agrees, thanks, apologizes, excessively aligns with the other’s opinion, lacking genuine interaction",
+            "Written-style Expression: Human-like: Conversational, flexible, and varied expression; Machine-like: Responses are well-structured and formal, overly formal wording, frequent listing, and vague word choice"
         ],
         "reference_scores": [5, 5]
     },
         "title": "Emotional Expression",
         "audio": sample1_audio_path,
         "sub_dims": [
+            "Semantic Level: Human-like: Displays human-like emotional responses to contexts such as sadness or joy; Machine-like: Fails to respond emotionally to the other’s feelings, or uses vague and context-inappropriate emotional language",
+            "Acoustic Level: Human-like: Pitch, volume, and rhythm dynamically change with emotion; Machine-like: Emotional tone is patterned or context-inappropriate"
         ],
+        "reference_scores": [5, 5]
     }
 ]
 DIMENSION_TITLES = [d["title"] for d in DIMENSIONS_DATA]
 SPECIAL_KEYWORDS = ["Code-switching", "Metaphor and Pragmatic Intent", "Auxiliary Vocalizations", "Accent"]
 MAX_SUB_DIMS = max(len(d['sub_dims']) for d in DIMENSIONS_DATA)