drzo committed on
Commit
425f10e
·
verified ·
1 Parent(s): aa62888

chore: update unicosys hypergraph model from CI pipeline

Browse files
README.md CHANGED
@@ -32,19 +32,19 @@ single trainable knowledge representation.
32
  | Text Encoder | 2-layer Transformer, 4 heads |
33
  | Graph Attention | 2-layer GAT, 4 heads |
34
  | Link Predictor | 2-layer MLP with margin ranking loss |
35
- | Total Parameters | **34,760,065** |
36
 
37
  ### Knowledge Graph Statistics
38
 
39
  | Metric | Count |
40
  |---|---|
41
- | Total Nodes | 203,646 |
42
- | Total Edges | 14,912 |
43
- | Cross-Links | 3,944 |
44
  | Entities | 16 |
45
- | Emails | 199,544 |
46
- | Financial Documents | 2,291 |
47
- | Timeline Events | 1,220 |
48
  | LEX Schemes | 13 |
49
  | Legal Filings | 7 |
50
 
@@ -53,9 +53,9 @@ single trainable knowledge representation.
53
  | Subsystem | Nodes |
54
  |---|---|
55
  | Core (Entities) | 16 |
56
- | Fincosys (Financial) | 3,908 |
57
- | Comcosys (Communications) | 199,544 |
58
- | RevStream1 (Evidence) | 145 |
59
  | Ad-Res-J7 (Legal) | 33 |
60
 
61
  ## Training
 
32
  | Text Encoder | 2-layer Transformer, 4 heads |
33
  | Graph Attention | 2-layer GAT, 4 heads |
34
  | Link Predictor | 2-layer MLP with margin ranking loss |
35
+ | Total Parameters | **36,023,681** |
36
 
37
  ### Knowledge Graph Statistics
38
 
39
  | Metric | Count |
40
  |---|---|
41
+ | Total Nodes | 272,683 |
42
+ | Total Edges | 14,816 |
43
+ | Cross-Links | 3,976 |
44
  | Entities | 16 |
45
+ | Emails | 199,553 |
46
+ | Financial Documents | 17,036 |
47
+ | Timeline Events | 54,346 |
48
  | LEX Schemes | 13 |
49
  | Legal Filings | 7 |
50
 
 
53
  | Subsystem | Nodes |
54
  |---|---|
55
  | Core (Entities) | 16 |
56
+ | Fincosys (Financial) | 72,935 |
57
+ | Comcosys (Communications) | 199,553 |
58
+ | RevStream1 (Evidence) | 146 |
59
  | Ad-Res-J7 (Legal) | 33 |
60
 
61
  ## Training
config.json CHANGED
@@ -15,7 +15,7 @@
15
  "gat_num_layers": 2,
16
  "hidden_dim": 256,
17
  "margin": 1.0,
18
- "max_nodes": 250000,
19
  "model_type": "unicosys_hypergraph",
20
  "negative_sample_ratio": 5,
21
  "node_embed_dim": 128,
@@ -31,10 +31,10 @@
31
  "lex_scheme": 8,
32
  "timeline_event": 9
33
  },
34
- "num_cross_links": 3944,
35
  "num_edge_types": 4,
36
  "num_entities": 16,
37
- "num_evidence": 203646,
38
  "num_node_types": 10,
39
  "num_subsystems": 7,
40
  "subsystem_vocab": {
@@ -50,6 +50,6 @@
50
  "text_max_length": 128,
51
  "text_num_heads": 4,
52
  "text_num_layers": 2,
53
- "text_vocab_size": 224,
54
  "transformers_version": "5.3.0"
55
  }
 
15
  "gat_num_layers": 2,
16
  "hidden_dim": 256,
17
  "margin": 1.0,
18
+ "max_nodes": 260000,
19
  "model_type": "unicosys_hypergraph",
20
  "negative_sample_ratio": 5,
21
  "node_embed_dim": 128,
 
31
  "lex_scheme": 8,
32
  "timeline_event": 9
33
  },
34
+ "num_cross_links": 3976,
35
  "num_edge_types": 4,
36
  "num_entities": 16,
37
+ "num_evidence": 272683,
38
  "num_node_types": 10,
39
  "num_subsystems": 7,
40
  "subsystem_vocab": {
 
50
  "text_max_length": 128,
51
  "text_num_heads": 4,
52
  "text_num_layers": 2,
53
+ "text_vocab_size": 160,
54
  "transformers_version": "5.3.0"
55
  }
graph_data.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:689217569f864fd7fe3a8d4654c31713ea85b50ae911059aded14327677bc084
3
- size 5269536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a22a6c8e60034f66c5837cc6d0291942b39702f169f12882a25f084361aa669f
3
+ size 6363552
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b04319465516bc36f8001497133b081f28f38152c992b54d70aa352669902be1
3
- size 139047108
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:502a653c3fc9bbcfd1845c3d45e9c0ede50be7b32bddb14af610e92b8354b8d3
3
+ size 144101572
model_summary.json CHANGED
@@ -1,30 +1,30 @@
1
  {
2
  "case_number": "2025-137857",
3
- "total_nodes": 203646,
4
- "total_edges": 15901,
5
- "total_cross_links": 3944,
6
  "node_types": {
7
  "entity": 16,
8
- "entity_document": 2291,
9
- "timeline_event": 1220,
10
- "hypergraph_node": 551,
11
- "fund_flow_analysis": 4,
12
- "email": 199544,
13
  "lex_scheme": 13,
14
  "legal_filing": 7
15
  },
16
  "edge_types": {
17
- "proves": 14911,
18
  "transaction_evidenced_by": 1
19
  },
20
  "subsystems": {
21
  "core": 16,
22
- "fincosys": 3908,
23
- "comcosys": 199544,
24
- "revstream1": 145,
25
  "ad_res_j7": 33
26
  },
27
- "model_params": 34760065,
28
  "model_architecture": {
29
  "node_embed_dim": 128,
30
  "text_embed_dim": 256,
 
1
  {
2
  "case_number": "2025-137857",
3
+ "total_nodes": 250000,
4
+ "total_edges": 15131,
5
+ "total_cross_links": 3976,
6
  "node_types": {
7
  "entity": 16,
8
+ "entity_document": 17036,
9
+ "timeline_event": 54346,
10
+ "hypergraph_node": 1692,
11
+ "fund_flow_analysis": 20,
12
+ "email": 199553,
13
  "lex_scheme": 13,
14
  "legal_filing": 7
15
  },
16
  "edge_types": {
17
+ "proves": 14815,
18
  "transaction_evidenced_by": 1
19
  },
20
  "subsystems": {
21
  "core": 16,
22
+ "fincosys": 72935,
23
+ "comcosys": 199553,
24
+ "revstream1": 146,
25
  "ad_res_j7": 33
26
  },
27
+ "model_params": 36023681,
28
  "model_architecture": {
29
  "node_embed_dim": 128,
30
  "text_embed_dim": 256,
node_id_mapping.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer.json CHANGED
@@ -55,73 +55,9 @@
55
  "@": 54,
56
  "_": 55,
57
  "*": 56,
58
- "[": 57,
59
- "]": 58,
60
- "\ud83d\udfe2": 59,
61
- "|": 60,
62
- "\u2014": 61,
63
- "\"": 62,
64
- "\ud83c\udfd5": 63,
65
- "\ufe0f": 64,
66
- "!": 65,
67
- "\u2019": 66,
68
- "\ud83d\udd52": 67,
69
- "=": 68,
70
- "$": 69,
71
- ";": 70,
72
- "?": 71,
73
- "\u00a3": 72,
74
- "\u2013": 73,
75
- "\u2026": 74,
76
- "\ud83c\udfac": 75,
77
- "\u2601": 76,
78
- "{": 77,
79
- "}": 78,
80
- "\u201c": 79,
81
- "\u201d": 80,
82
- "\ud83d\udd25": 81,
83
- "\ud83d\udd11": 82,
84
- "\ud83d\udc40": 83,
85
- "\ud83c\udfc3": 84,
86
- "\u200d": 85,
87
- "\u2640": 86,
88
- "\ud83d\udea8": 87,
89
- "\ud83d\udd17": 88,
90
- "\ud83d\ude80": 89,
91
- "\ud83e\uddd0": 90,
92
- "\ud83d\uddd3": 91,
93
- "\ud83d\udcac": 92,
94
- "\u26a0": 93,
95
- "\ud83d\ude31": 94,
96
- "\ud83c\udf0d": 95,
97
- "\ud83e\udee7": 96,
98
- "\ud83e\udd76": 97,
99
- "\ud83d\udc64": 98,
100
- "\ud83c\udf89": 99,
101
- "\ud83d\udcc8": 100,
102
- "\ud83c\udf38": 101,
103
- "\u00a0": 102,
104
- "\ud83d\udc8c": 103,
105
- "\u2122": 104,
106
- "\u00f1": 105,
107
- "\u263a": 106,
108
- "\ud83d\udc9c": 107,
109
- "\u26f3": 108,
110
- "\u26a1": 109,
111
- "\u23f0": 110,
112
- "\u2728": 111,
113
- "\u2018": 112,
114
- "\ud83c\udfe0": 113,
115
- "\ud83c\udfe1": 114,
116
- "\u00ae": 115,
117
- "\ud83d\udcb8": 116,
118
- "~": 117,
119
- "\ud83c\udf9f": 118,
120
- "\ud83d\udd14": 119,
121
- "\ud83d\ude97": 120,
122
- "\ud83e\udde0": 121,
123
- "\ud83c\udf0e": 122,
124
- "\u2011": 123
125
  },
126
- "next_id": 124
127
  }
 
55
  "@": 54,
56
  "_": 55,
57
  "*": 56,
58
+ "=": 57,
59
+ "<": 58,
60
+ ">": 59
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
61
  },
62
+ "next_id": 60
63
  }