File size: 1,631 Bytes
da6e1f7
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
{
  "model_type": "RandomForestClassifier",
  "library": "sklearn",
  "task": "text-classification",
  "subtask": "query-dependency-detection",
  "feature_names": [
    "q1_length",
    "q2_length",
    "length_diff",
    "length_ratio",
    "q1_char_length",
    "q2_char_length",
    "char_length_ratio",
    "common_words",
    "jaccard_similarity",
    "word_overlap_ratio",
    "stem_overlap",
    "bigram_overlap",
    "trigram_overlap",
    "pronoun_count",
    "reference_count",
    "connective_count",
    "early_pronoun_count",
    "early_reference_count",
    "early_connective_count",
    "dependency_phrase_count",
    "has_dependency_phrase",
    "semantic_similarity",
    "entity_overlap",
    "q1_exclamation",
    "q2_exclamation",
    "q1_comma_count",
    "q2_comma_count",
    "q1_avg_word_length",
    "q2_avg_word_length",
    "complexity_diff",
    "q1_syllable_density",
    "q2_syllable_density",
    "continuation_markers",
    "contrast_markers",
    "causation_markers",
    "exemplification_markers",
    "elaboration_markers",
    "repeated_words_q2",
    "max_word_repetition",
    "q1_caps_words",
    "q2_caps_words",
    "spatial_references",
    "temporal_references",
    "comparative_references",
    "quantitative_references"
  ],
  "label_classes": [
    "dependent",
    "independent"
  ],
  "num_features": 45,
  "model_params": {
    "n_estimators": 500,
    "max_depth": 15,
    "min_samples_split": 7,
    "min_samples_leaf": 3,
    "max_features": "sqrt",
    "random_state": 42,
    "class_weight": "balanced"
  },
  "created_at": "2025-07-25T18:08:02.989967",
  "version": "1.0.0"
}