kaichenxu committed on
Commit
89d80f6
·
verified ·
1 Parent(s): 85680c7

Upload scCAFM model assets

Browse files
README.md CHANGED
@@ -9,7 +9,7 @@ tags:
9
  scCAFM is a causality-aware foundation model designed for large-scale single-cell transcriptomic analysis. Unlike existing single-cell foundation models that mainly learn associative gene relationships or operate only at the dataset- or cell-type level, scCAFM enables cell-specific causal inference at atlas scale while simultaneously learning transferable gene and cell embeddings enriched with causal semantics. By jointly modeling gene regulatory structure and context-dependent embeddings, scCAFM provides a powerful foundation for studying heterogeneous cellular states, developmental trajectories, disease progression, and perturbation responses.
10
  <br/>
11
  <div align=center>
12
- <img src="Fig1.png" width="70%">
13
  </div>
14
  <br/>
15
 
 
9
  scCAFM is a causality-aware foundation model designed for large-scale single-cell transcriptomic analysis. Unlike existing single-cell foundation models that mainly learn associative gene relationships or operate only at the dataset- or cell-type level, scCAFM enables cell-specific causal inference at atlas scale while simultaneously learning transferable gene and cell embeddings enriched with causal semantics. By jointly modeling gene regulatory structure and context-dependent embeddings, scCAFM provides a powerful foundation for studying heterogeneous cellular states, developmental trajectories, disease progression, and perturbation responses.
10
  <br/>
11
  <div align=center>
12
+ <img src="Fig1.png" width="90%">
13
  </div>
14
  <br/>
15
 
models/cond_dict.json CHANGED
@@ -8,15 +8,15 @@
8
  "token_index": 1
9
  },
10
  {
11
- "cond_value": "10x 3' v2",
12
  "token_index": 2
13
  },
14
  {
15
- "cond_value": "seq-well",
16
  "token_index": 3
17
  },
18
  {
19
- "cond_value": "10x 5' v2",
20
  "token_index": 4
21
  },
22
  {
@@ -24,71 +24,71 @@
24
  "token_index": 5
25
  },
26
  {
27
- "cond_value": "human",
28
  "token_index": 6
29
  },
30
  {
31
- "cond_value": "blood",
32
  "token_index": 7
33
  },
34
  {
35
- "cond_value": "umbilical cord blood",
36
  "token_index": 8
37
  },
38
  {
39
- "cond_value": "normal",
40
  "token_index": 9
41
  },
42
  {
43
- "cond_value": "drop-seq",
44
  "token_index": 10
45
  },
46
  {
47
- "cond_value": "brain",
48
  "token_index": 11
49
  },
50
  {
51
- "cond_value": "left frontal lobe",
52
  "token_index": 12
53
  },
54
  {
55
- "cond_value": "left temporal lobe",
56
  "token_index": 13
57
  },
58
  {
59
- "cond_value": "right temporal lobe",
60
  "token_index": 14
61
  },
62
  {
63
- "cond_value": "forebrain",
64
  "token_index": 15
65
  },
66
  {
67
- "cond_value": "right frontal lobe",
68
  "token_index": 16
69
  },
70
  {
71
- "cond_value": "frontal lobe",
72
  "token_index": 17
73
  },
74
  {
75
- "cond_value": "parietal lobe",
76
  "token_index": 18
77
  },
78
  {
79
- "cond_value": "temporal lobe",
80
  "token_index": 19
81
  },
82
  {
83
- "cond_value": "occipital lobe",
84
  "token_index": 20
85
  },
86
  {
87
- "cond_value": "glioblastoma",
88
  "token_index": 21
89
  },
90
  {
91
- "cond_value": "cerebral nuclei",
92
  "token_index": 22
93
  },
94
  {
@@ -96,203 +96,203 @@
96
  "token_index": 23
97
  },
98
  {
99
- "cond_value": "dorsolateral prefrontal cortex",
100
  "token_index": 24
101
  },
102
  {
103
- "cond_value": "thalamic complex",
104
  "token_index": 25
105
  },
106
  {
107
- "cond_value": "primary motor cortex",
108
  "token_index": 26
109
  },
110
  {
111
- "cond_value": "hypothalamus",
112
  "token_index": 27
113
  },
114
  {
115
- "cond_value": "hippocampal formation",
116
  "token_index": 28
117
  },
118
  {
119
- "cond_value": "midbrain",
120
  "token_index": 29
121
  },
122
  {
123
- "cond_value": "pons",
124
  "token_index": 30
125
  },
126
  {
127
- "cond_value": "myelencephalon",
128
  "token_index": 31
129
  },
130
  {
131
- "cond_value": "cerebellum",
132
  "token_index": 32
133
  },
134
  {
135
- "cond_value": "gexscope technology",
136
  "token_index": 33
137
  },
138
  {
139
- "cond_value": "indrop",
140
  "token_index": 34
141
  },
142
  {
143
- "cond_value": "bd rhapsody whole transcriptome analysis",
144
  "token_index": 35
145
  },
146
  {
147
- "cond_value": "lung",
148
  "token_index": 36
149
  },
150
  {
151
- "cond_value": "squamous cell lung carcinoma",
152
  "token_index": 37
153
  },
154
  {
155
- "cond_value": "lung adenocarcinoma",
156
  "token_index": 38
157
  },
158
  {
159
- "cond_value": "non-small cell lung carcinoma",
160
  "token_index": 39
161
  },
162
  {
163
- "cond_value": "middle temporal gyrus",
164
  "token_index": 40
165
  },
166
  {
167
- "cond_value": "substantia nigra pars compacta",
168
  "token_index": 41
169
  },
170
  {
171
- "cond_value": "breast",
172
  "token_index": 42
173
  },
174
  {
175
- "cond_value": "10x 5' transcription profiling",
176
  "token_index": 43
177
  },
178
  {
179
- "cond_value": "lung parenchyma",
180
  "token_index": 44
181
  },
182
  {
183
- "cond_value": "lower lobe of left lung",
184
  "token_index": 45
185
  },
186
  {
187
- "cond_value": "upper lobe of left lung",
188
  "token_index": 46
189
  },
190
  {
191
- "cond_value": "brodmann (1909) area 4",
192
  "token_index": 47
193
  },
194
  {
195
- "cond_value": "prefrontal cortex",
196
  "token_index": 48
197
  },
198
  {
199
- "cond_value": "orbitofrontal cortex",
200
  "token_index": 49
201
  },
202
  {
203
- "cond_value": "anterior cingulate cortex",
204
  "token_index": 50
205
  },
206
  {
207
- "cond_value": "primary visual cortex",
208
  "token_index": 51
209
  },
210
  {
211
- "cond_value": "microwell-seq",
212
  "token_index": 52
213
  },
214
  {
215
- "cond_value": "smart-seq v4",
216
  "token_index": 53
217
  },
218
  {
219
- "cond_value": "mouse",
220
  "token_index": 54
221
  },
222
  {
223
- "cond_value": "brain meninx",
224
  "token_index": 55
225
  },
226
  {
227
- "cond_value": "sci-rna-seq",
228
  "token_index": 56
229
  },
230
  {
231
- "cond_value": "telencephalon",
232
  "token_index": 57
233
  },
234
  {
235
- "cond_value": "parietal cortex",
236
  "token_index": 58
237
  },
238
  {
239
- "cond_value": "visual cortex",
240
  "token_index": 59
241
  },
242
  {
243
- "cond_value": "entorhinal cortex",
244
  "token_index": 60
245
  },
246
  {
247
- "cond_value": "primary somatosensory cortex",
248
  "token_index": 61
249
  },
250
  {
251
- "cond_value": "agranular insular cortex",
252
  "token_index": 62
253
  },
254
  {
255
- "cond_value": "subicular complex",
256
  "token_index": 63
257
  },
258
  {
259
- "cond_value": "retrosplenial granular cortex",
260
  "token_index": 64
261
  },
262
  {
263
- "cond_value": "posterior parietal association areas",
264
  "token_index": 65
265
  },
266
  {
267
- "cond_value": "auditory cortex",
268
  "token_index": 66
269
  },
270
  {
271
- "cond_value": "temporal cortex",
272
  "token_index": 67
273
  },
274
  {
275
- "cond_value": "medial orbital frontal cortex",
276
  "token_index": 68
277
  },
278
  {
279
- "cond_value": "lateral visual area",
280
  "token_index": 69
281
  },
282
  {
283
- "cond_value": "caudate nucleus",
284
  "token_index": 70
285
  },
286
  {
287
- "cond_value": "putamen",
288
  "token_index": 71
289
  },
290
  {
291
- "cond_value": "primary auditory cortex",
292
  "token_index": 72
293
  },
294
  {
295
- "cond_value": "angular gyrus",
296
  "token_index": 73
297
  },
298
  {
@@ -300,307 +300,307 @@
300
  "token_index": 74
301
  },
302
  {
303
- "cond_value": "interventricular septum",
304
  "token_index": 75
305
  },
306
  {
307
- "cond_value": "apex of heart",
308
  "token_index": 76
309
  },
310
  {
311
- "cond_value": "heart left ventricle",
312
  "token_index": 77
313
  },
314
  {
315
- "cond_value": "heart right ventricle",
316
  "token_index": 78
317
  },
318
  {
319
- "cond_value": "left cardiac atrium",
320
  "token_index": 79
321
  },
322
  {
323
- "cond_value": "smart-seq",
324
  "token_index": 80
325
  },
326
  {
327
- "cond_value": "smart-seq2",
328
  "token_index": 81
329
  },
330
  {
331
- "cond_value": "diencephalon",
332
  "token_index": 82
333
  },
334
  {
335
- "cond_value": "brain gray matter",
336
  "token_index": 83
337
  },
338
  {
339
- "cond_value": "brain white matter",
340
  "token_index": 84
341
  },
342
  {
343
- "cond_value": "barrel cortex",
344
  "token_index": 85
345
  },
346
  {
347
- "cond_value": "cerebellar hemisphere",
348
  "token_index": 86
349
  },
350
  {
351
- "cond_value": "frontal cortex",
352
  "token_index": 87
353
  },
354
  {
355
- "cond_value": "trudrop",
356
  "token_index": 88
357
  },
358
  {
359
- "cond_value": "liver",
360
  "token_index": 89
361
  },
362
  {
363
- "cond_value": "lower lobe of right lung",
364
  "token_index": 90
365
  },
366
  {
367
- "cond_value": "upper lobe of right lung",
368
  "token_index": 91
369
  },
370
  {
371
- "cond_value": "right lung",
372
  "token_index": 92
373
  },
374
  {
375
- "cond_value": "left lung",
376
  "token_index": 93
377
  },
378
  {
379
- "cond_value": "middle lobe of right lung",
380
  "token_index": 94
381
  },
382
  {
383
- "cond_value": "transverse colon",
384
  "token_index": 95
385
  },
386
  {
387
- "cond_value": "sigmoid colon",
388
  "token_index": 96
389
  },
390
  {
391
- "cond_value": "descending colon",
392
  "token_index": 97
393
  },
394
  {
395
- "cond_value": "ascending colon",
396
  "token_index": 98
397
  },
398
  {
399
- "cond_value": "hepatic flexure of colon",
400
  "token_index": 99
401
  },
402
  {
403
- "cond_value": "hepatic cecum",
404
  "token_index": 100
405
  },
406
  {
407
- "cond_value": "rectum",
408
  "token_index": 101
409
  },
410
  {
411
- "cond_value": "kidney",
412
  "token_index": 102
413
  },
414
  {
415
- "cond_value": "lymph node",
416
  "token_index": 103
417
  },
418
  {
419
- "cond_value": "blastoma",
420
  "token_index": 104
421
  },
422
  {
423
- "cond_value": "colorectal cancer",
424
  "token_index": 105
425
  },
426
  {
427
- "cond_value": "tubular adenoma",
428
  "token_index": 106
429
  },
430
  {
431
- "cond_value": "tubulovillous adenoma",
432
  "token_index": 107
433
  },
434
  {
435
- "cond_value": "clear cell renal carcinoma",
436
  "token_index": 108
437
  },
438
  {
439
- "cond_value": "renal papilla",
440
  "token_index": 109
441
  },
442
  {
443
- "cond_value": "cortex of kidney",
444
  "token_index": 110
445
  },
446
  {
447
- "cond_value": "renal medulla",
448
  "token_index": 111
449
  },
450
  {
451
- "cond_value": "cingulate cortex",
452
  "token_index": 112
453
  },
454
  {
455
- "cond_value": "split-seq",
456
  "token_index": 113
457
  },
458
  {
459
- "cond_value": "10x 3' transcription profiling",
460
  "token_index": 114
461
  },
462
  {
463
- "cond_value": "strt-seq",
464
  "token_index": 115
465
  },
466
  {
467
- "cond_value": "pleural effusion",
468
  "token_index": 116
469
  },
470
  {
471
- "cond_value": "adrenal gland",
472
  "token_index": 117
473
  },
474
  {
475
- "cond_value": "axilla",
476
  "token_index": 118
477
  },
478
  {
479
- "cond_value": "bone spine",
480
  "token_index": 119
481
  },
482
  {
483
- "cond_value": "right parietal lobe",
484
  "token_index": 120
485
  },
486
  {
487
- "cond_value": "temporoparietal junction",
488
  "token_index": 121
489
  },
490
  {
491
- "cond_value": "left parietal lobe",
492
  "token_index": 122
493
  },
494
  {
495
- "cond_value": "small cell lung carcinoma",
496
  "token_index": 123
497
  },
498
  {
499
- "cond_value": "body of stomach",
500
  "token_index": 124
501
  },
502
  {
503
- "cond_value": "gastric cancer",
504
  "token_index": 125
505
  },
506
  {
507
- "cond_value": "lateral entorhinal cortex",
508
  "token_index": 126
509
  },
510
  {
511
- "cond_value": "retrosplenial region",
512
  "token_index": 127
513
  },
514
  {
515
- "cond_value": "anterolateral visual area",
516
  "token_index": 128
517
  },
518
  {
519
- "cond_value": "secondary somatosensory cortex",
520
  "token_index": 129
521
  },
522
  {
523
- "cond_value": "medial entorhinal cortex",
524
  "token_index": 130
525
  },
526
  {
527
- "cond_value": "gustatory cortex",
528
  "token_index": 131
529
  },
530
  {
531
- "cond_value": "claustrum of brain",
532
  "token_index": 132
533
  },
534
  {
535
- "cond_value": "caudate lobe of liver",
536
  "token_index": 133
537
  },
538
  {
539
- "cond_value": "occipital cortex",
540
  "token_index": 134
541
  },
542
  {
543
- "cond_value": "renal pelvis",
544
  "token_index": 135
545
  },
546
  {
547
- "cond_value": "kidney blood vessel",
548
  "token_index": 136
549
  },
550
  {
551
- "cond_value": "heart",
552
  "token_index": 137
553
  },
554
  {
555
- "cond_value": "scalebio single cell rna sequencing",
556
  "token_index": 138
557
  },
558
  {
559
- "cond_value": "10x 3' v1",
560
  "token_index": 139
561
  },
562
  {
563
- "cond_value": "adrenal tissue",
564
  "token_index": 140
565
  },
566
  {
567
- "cond_value": "bone marrow",
568
  "token_index": 141
569
  },
570
  {
571
- "cond_value": "b-cell non-hodgkin lymphoma",
572
  "token_index": 142
573
  },
574
  {
575
- "cond_value": "follicular lymphoma",
576
  "token_index": 143
577
  },
578
  {
579
- "cond_value": "anterior wall of left ventricle",
580
  "token_index": 144
581
  },
582
  {
583
- "cond_value": "cardiac atrium",
584
  "token_index": 145
585
  },
586
  {
587
- "cond_value": "cardiac ventricle",
588
  "token_index": 146
589
  },
590
  {
591
- "cond_value": "coronary artery",
592
  "token_index": 147
593
  },
594
  {
595
- "cond_value": "alveolus of lung",
596
  "token_index": 148
597
  },
598
  {
599
- "cond_value": "superior frontal gyrus",
600
  "token_index": 149
601
  },
602
  {
603
- "cond_value": "basal ganglion",
604
  "token_index": 150
605
  },
606
  {
@@ -608,103 +608,103 @@
608
  "token_index": 151
609
  },
610
  {
611
- "cond_value": "dronc-seq",
612
  "token_index": 152
613
  },
614
  {
615
- "cond_value": "mesonephros",
616
  "token_index": 153
617
  },
618
  {
619
- "cond_value": "renal glomerulus",
620
  "token_index": 154
621
  },
622
  {
623
- "cond_value": "outer medulla of kidney",
624
  "token_index": 155
625
  },
626
  {
627
- "cond_value": "inner medulla of kidney",
628
  "token_index": 156
629
  },
630
  {
631
- "cond_value": "anterior cingulate gyrus",
632
  "token_index": 157
633
  },
634
  {
635
- "cond_value": "cel-seq2",
636
  "token_index": 158
637
  },
638
  {
639
- "cond_value": "bd rhapsody targeted mrna",
640
  "token_index": 159
641
  },
642
  {
643
- "cond_value": "venous blood",
644
  "token_index": 160
645
  },
646
  {
647
- "cond_value": "cerebellar cortex",
648
  "token_index": 161
649
  },
650
  {
651
- "cond_value": "hemisphere part of cerebellar posterior lobe",
652
  "token_index": 162
653
  },
654
  {
655
- "cond_value": "dentate nucleus",
656
  "token_index": 163
657
  },
658
  {
659
- "cond_value": "basal zone of heart",
660
  "token_index": 164
661
  },
662
  {
663
- "cond_value": "intestine",
664
  "token_index": 165
665
  },
666
  {
667
- "cond_value": "ileum",
668
  "token_index": 166
669
  },
670
  {
671
- "cond_value": "acute myeloid leukemia",
672
  "token_index": 167
673
  },
674
  {
675
- "cond_value": "acute promyelocytic leukemia",
676
  "token_index": 168
677
  },
678
  {
679
- "cond_value": "chromophobe renal cell carcinoma",
680
  "token_index": 169
681
  },
682
  {
683
- "cond_value": "adenocarcinoma",
684
  "token_index": 170
685
  },
686
  {
687
- "cond_value": "neuroendocrine carcinoma",
688
  "token_index": 171
689
  },
690
  {
691
- "cond_value": "wilms tumor",
692
  "token_index": 172
693
  },
694
  {
695
- "cond_value": "pilocytic astrocytoma",
696
  "token_index": 173
697
  },
698
  {
699
- "cond_value": "upper outer quadrant of breast",
700
  "token_index": 174
701
  },
702
  {
703
- "cond_value": "right occipital lobe",
704
  "token_index": 175
705
  },
706
  {
707
- "cond_value": "lingula of left lung",
708
  "token_index": 176
709
  }
710
  ]
 
8
  "token_index": 1
9
  },
10
  {
11
+ "cond_value": "human",
12
  "token_index": 2
13
  },
14
  {
15
+ "cond_value": "breast",
16
  "token_index": 3
17
  },
18
  {
19
+ "cond_value": "normal",
20
  "token_index": 4
21
  },
22
  {
 
24
  "token_index": 5
25
  },
26
  {
27
+ "cond_value": "10x 3' v2",
28
  "token_index": 6
29
  },
30
  {
31
+ "cond_value": "drop-seq",
32
  "token_index": 7
33
  },
34
  {
35
+ "cond_value": "smart-seq2",
36
  "token_index": 8
37
  },
38
  {
39
+ "cond_value": "sci-rna-seq",
40
  "token_index": 9
41
  },
42
  {
43
+ "cond_value": "lung",
44
  "token_index": 10
45
  },
46
  {
47
+ "cond_value": "microwell-seq",
48
  "token_index": 11
49
  },
50
  {
51
+ "cond_value": "10x 5' v2",
52
  "token_index": 12
53
  },
54
  {
55
+ "cond_value": "10x 5' transcription profiling",
56
  "token_index": 13
57
  },
58
  {
59
+ "cond_value": "lingula of left lung",
60
  "token_index": 14
61
  },
62
  {
63
+ "cond_value": "lower lobe of left lung",
64
  "token_index": 15
65
  },
66
  {
67
+ "cond_value": "upper lobe of left lung",
68
  "token_index": 16
69
  },
70
  {
71
+ "cond_value": "10x 3' transcription profiling",
72
  "token_index": 17
73
  },
74
  {
75
+ "cond_value": "blood",
76
  "token_index": 18
77
  },
78
  {
79
+ "cond_value": "thalamic complex",
80
  "token_index": 19
81
  },
82
  {
83
+ "cond_value": "hypothalamus",
84
  "token_index": 20
85
  },
86
  {
87
+ "cond_value": "midbrain",
88
  "token_index": 21
89
  },
90
  {
91
+ "cond_value": "pons",
92
  "token_index": 22
93
  },
94
  {
 
96
  "token_index": 23
97
  },
98
  {
99
+ "cond_value": "myelencephalon",
100
  "token_index": 24
101
  },
102
  {
103
+ "cond_value": "cerebral nuclei",
104
  "token_index": 25
105
  },
106
  {
107
+ "cond_value": "hippocampal formation",
108
  "token_index": 26
109
  },
110
  {
111
+ "cond_value": "cerebellum",
112
  "token_index": 27
113
  },
114
  {
115
+ "cond_value": "interventricular septum",
116
  "token_index": 28
117
  },
118
  {
119
+ "cond_value": "heart left ventricle",
120
  "token_index": 29
121
  },
122
  {
123
+ "cond_value": "heart right ventricle",
124
  "token_index": 30
125
  },
126
  {
127
+ "cond_value": "apex of heart",
128
  "token_index": 31
129
  },
130
  {
131
+ "cond_value": "cardiac atrium",
132
  "token_index": 32
133
  },
134
  {
135
+ "cond_value": "cardiac ventricle",
136
  "token_index": 33
137
  },
138
  {
139
+ "cond_value": "coronary artery",
140
  "token_index": 34
141
  },
142
  {
143
+ "cond_value": "heart",
144
  "token_index": 35
145
  },
146
  {
147
+ "cond_value": "temporal cortex",
148
  "token_index": 36
149
  },
150
  {
151
+ "cond_value": "primary motor cortex",
152
  "token_index": 37
153
  },
154
  {
155
+ "cond_value": "prefrontal cortex",
156
  "token_index": 38
157
  },
158
  {
159
+ "cond_value": "parietal cortex",
160
  "token_index": 39
161
  },
162
  {
163
+ "cond_value": "primary somatosensory cortex",
164
  "token_index": 40
165
  },
166
  {
167
+ "cond_value": "primary visual cortex",
168
  "token_index": 41
169
  },
170
  {
171
+ "cond_value": "dorsolateral prefrontal cortex",
172
  "token_index": 42
173
  },
174
  {
175
+ "cond_value": "strt-seq",
176
  "token_index": 43
177
  },
178
  {
179
+ "cond_value": "bd rhapsody whole transcriptome analysis",
180
  "token_index": 44
181
  },
182
  {
183
+ "cond_value": "brain",
184
  "token_index": 45
185
  },
186
  {
187
+ "cond_value": "lymph node",
188
  "token_index": 46
189
  },
190
  {
191
+ "cond_value": "pleural effusion",
192
  "token_index": 47
193
  },
194
  {
195
+ "cond_value": "liver",
196
  "token_index": 48
197
  },
198
  {
199
+ "cond_value": "adrenal gland",
200
  "token_index": 49
201
  },
202
  {
203
+ "cond_value": "axilla",
204
  "token_index": 50
205
  },
206
  {
207
+ "cond_value": "bone spine",
208
  "token_index": 51
209
  },
210
  {
211
+ "cond_value": "left temporal lobe",
212
  "token_index": 52
213
  },
214
  {
215
+ "cond_value": "right frontal lobe",
216
  "token_index": 53
217
  },
218
  {
219
+ "cond_value": "right parietal lobe",
220
  "token_index": 54
221
  },
222
  {
223
+ "cond_value": "right temporal lobe",
224
  "token_index": 55
225
  },
226
  {
227
+ "cond_value": "forebrain",
228
  "token_index": 56
229
  },
230
  {
231
+ "cond_value": "left frontal lobe",
232
  "token_index": 57
233
  },
234
  {
235
+ "cond_value": "temporoparietal junction",
236
  "token_index": 58
237
  },
238
  {
239
+ "cond_value": "left parietal lobe",
240
  "token_index": 59
241
  },
242
  {
243
+ "cond_value": "lung adenocarcinoma",
244
  "token_index": 60
245
  },
246
  {
247
+ "cond_value": "small cell lung carcinoma",
248
  "token_index": 61
249
  },
250
  {
251
+ "cond_value": "glioblastoma",
252
  "token_index": 62
253
  },
254
  {
255
+ "cond_value": "smart-seq v4",
256
  "token_index": 63
257
  },
258
  {
259
+ "cond_value": "anterior cingulate cortex",
260
  "token_index": 64
261
  },
262
  {
263
+ "cond_value": "angular gyrus",
264
  "token_index": 65
265
  },
266
  {
267
+ "cond_value": "primary auditory cortex",
268
  "token_index": 66
269
  },
270
  {
271
+ "cond_value": "middle temporal gyrus",
272
  "token_index": 67
273
  },
274
  {
275
+ "cond_value": "anterior cingulate gyrus",
276
  "token_index": 68
277
  },
278
  {
279
+ "cond_value": "mouse",
280
  "token_index": 69
281
  },
282
  {
283
+ "cond_value": "diencephalon",
284
  "token_index": 70
285
  },
286
  {
287
+ "cond_value": "parietal lobe",
288
  "token_index": 71
289
  },
290
  {
291
+ "cond_value": "temporal lobe",
292
  "token_index": 72
293
  },
294
  {
295
+ "cond_value": "frontal lobe",
296
  "token_index": 73
297
  },
298
  {
 
300
  "token_index": 74
301
  },
302
  {
303
+ "cond_value": "left cardiac atrium",
304
  "token_index": 75
305
  },
306
  {
307
+ "cond_value": "10x 3' v1",
308
  "token_index": 76
309
  },
310
  {
311
+ "cond_value": "lung parenchyma",
312
  "token_index": 77
313
  },
314
  {
315
+ "cond_value": "anterior wall of left ventricle",
316
  "token_index": 78
317
  },
318
  {
319
+ "cond_value": "cortex of kidney",
320
  "token_index": 79
321
  },
322
  {
323
+ "cond_value": "kidney",
324
  "token_index": 80
325
  },
326
  {
327
+ "cond_value": "renal medulla",
328
  "token_index": 81
329
  },
330
  {
331
+ "cond_value": "renal pelvis",
332
  "token_index": 82
333
  },
334
  {
335
+ "cond_value": "kidney blood vessel",
336
  "token_index": 83
337
  },
338
  {
339
+ "cond_value": "non-small cell lung carcinoma",
340
  "token_index": 84
341
  },
342
  {
343
+ "cond_value": "squamous cell lung carcinoma",
344
  "token_index": 85
345
  },
346
  {
347
+ "cond_value": "substantia nigra pars compacta",
348
  "token_index": 86
349
  },
350
  {
351
+ "cond_value": "entorhinal cortex",
352
  "token_index": 87
353
  },
354
  {
355
+ "cond_value": "occipital lobe",
356
  "token_index": 88
357
  },
358
  {
359
+ "cond_value": "umbilical cord blood",
360
  "token_index": 89
361
  },
362
  {
363
+ "cond_value": "occipital cortex",
364
  "token_index": 90
365
  },
366
  {
367
+ "cond_value": "frontal cortex",
368
  "token_index": 91
369
  },
370
  {
371
+ "cond_value": "seq-well",
372
  "token_index": 92
373
  },
374
  {
375
+ "cond_value": "brain meninx",
376
  "token_index": 93
377
  },
378
  {
379
+ "cond_value": "scalebio single cell rna sequencing",
380
  "token_index": 94
381
  },
382
  {
383
+ "cond_value": "retrosplenial granular cortex",
384
  "token_index": 95
385
  },
386
  {
387
+ "cond_value": "visual cortex",
388
  "token_index": 96
389
  },
390
  {
391
+ "cond_value": "agranular insular cortex",
392
  "token_index": 97
393
  },
394
  {
395
+ "cond_value": "auditory cortex",
396
  "token_index": 98
397
  },
398
  {
399
+ "cond_value": "subicular complex",
400
  "token_index": 99
401
  },
402
  {
403
+ "cond_value": "medial orbital frontal cortex",
404
  "token_index": 100
405
  },
406
  {
407
+ "cond_value": "lateral visual area",
408
  "token_index": 101
409
  },
410
  {
411
+ "cond_value": "posterior parietal association areas",
412
  "token_index": 102
413
  },
414
  {
415
+ "cond_value": "telencephalon",
416
  "token_index": 103
417
  },
418
  {
419
+ "cond_value": "brodmann (1909) area 4",
420
  "token_index": 104
421
  },
422
  {
423
+ "cond_value": "trudrop",
424
  "token_index": 105
425
  },
426
  {
427
+ "cond_value": "lower lobe of right lung",
428
  "token_index": 106
429
  },
430
  {
431
+ "cond_value": "upper lobe of right lung",
432
  "token_index": 107
433
  },
434
  {
435
+ "cond_value": "right lung",
436
  "token_index": 108
437
  },
438
  {
439
+ "cond_value": "left lung",
440
  "token_index": 109
441
  },
442
  {
443
+ "cond_value": "middle lobe of right lung",
444
  "token_index": 110
445
  },
446
  {
447
+ "cond_value": "transverse colon",
448
  "token_index": 111
449
  },
450
  {
451
+ "cond_value": "sigmoid colon",
452
  "token_index": 112
453
  },
454
  {
455
+ "cond_value": "descending colon",
456
  "token_index": 113
457
  },
458
  {
459
+ "cond_value": "ascending colon",
460
  "token_index": 114
461
  },
462
  {
463
+ "cond_value": "hepatic flexure of colon",
464
  "token_index": 115
465
  },
466
  {
467
+ "cond_value": "hepatic cecum",
468
  "token_index": 116
469
  },
470
  {
471
+ "cond_value": "rectum",
472
  "token_index": 117
473
  },
474
  {
475
+ "cond_value": "blastoma",
476
  "token_index": 118
477
  },
478
  {
479
+ "cond_value": "colorectal cancer",
480
  "token_index": 119
481
  },
482
  {
483
+ "cond_value": "tubular adenoma",
484
  "token_index": 120
485
  },
486
  {
487
+ "cond_value": "tubulovillous adenoma",
488
  "token_index": 121
489
  },
490
  {
491
+ "cond_value": "clear cell renal carcinoma",
492
  "token_index": 122
493
  },
494
  {
495
+ "cond_value": "cerebellar cortex",
496
  "token_index": 123
497
  },
498
  {
499
+ "cond_value": "hemisphere part of cerebellar posterior lobe",
500
  "token_index": 124
501
  },
502
  {
503
+ "cond_value": "dentate nucleus",
504
  "token_index": 125
505
  },
506
  {
507
+ "cond_value": "split-seq",
508
  "token_index": 126
509
  },
510
  {
511
+ "cond_value": "caudate lobe of liver",
512
  "token_index": 127
513
  },
514
  {
515
+ "cond_value": "bd rhapsody targeted mrna",
516
  "token_index": 128
517
  },
518
  {
519
+ "cond_value": "venous blood",
520
  "token_index": 129
521
  },
522
  {
523
+ "cond_value": "gexscope technology",
524
  "token_index": 130
525
  },
526
  {
527
+ "cond_value": "adrenal tissue",
528
  "token_index": 131
529
  },
530
  {
531
+ "cond_value": "indrop",
532
  "token_index": 132
533
  },
534
  {
535
+ "cond_value": "basal ganglion",
536
  "token_index": 133
537
  },
538
  {
539
+ "cond_value": "intestine",
540
  "token_index": 134
541
  },
542
  {
543
+ "cond_value": "lateral entorhinal cortex",
544
  "token_index": 135
545
  },
546
  {
547
+ "cond_value": "retrosplenial region",
548
  "token_index": 136
549
  },
550
  {
551
+ "cond_value": "anterolateral visual area",
552
  "token_index": 137
553
  },
554
  {
555
+ "cond_value": "secondary somatosensory cortex",
556
  "token_index": 138
557
  },
558
  {
559
+ "cond_value": "medial entorhinal cortex",
560
  "token_index": 139
561
  },
562
  {
563
+ "cond_value": "gustatory cortex",
564
  "token_index": 140
565
  },
566
  {
567
+ "cond_value": "claustrum of brain",
568
  "token_index": 141
569
  },
570
  {
571
+ "cond_value": "alveolus of lung",
572
  "token_index": 142
573
  },
574
  {
575
+ "cond_value": "body of stomach",
576
  "token_index": 143
577
  },
578
  {
579
+ "cond_value": "gastric cancer",
580
  "token_index": 144
581
  },
582
  {
583
+ "cond_value": "cel-seq2",
584
  "token_index": 145
585
  },
586
  {
587
+ "cond_value": "renal papilla",
588
  "token_index": 146
589
  },
590
  {
591
+ "cond_value": "upper outer quadrant of breast",
592
  "token_index": 147
593
  },
594
  {
595
+ "cond_value": "caudate nucleus",
596
  "token_index": 148
597
  },
598
  {
599
+ "cond_value": "putamen",
600
  "token_index": 149
601
  },
602
  {
603
+ "cond_value": "cingulate cortex",
604
  "token_index": 150
605
  },
606
  {
 
608
  "token_index": 151
609
  },
610
  {
611
+ "cond_value": "bone marrow",
612
  "token_index": 152
613
  },
614
  {
615
+ "cond_value": "b-cell non-hodgkin lymphoma",
616
  "token_index": 153
617
  },
618
  {
619
+ "cond_value": "follicular lymphoma",
620
  "token_index": 154
621
  },
622
  {
623
+ "cond_value": "smart-seq",
624
  "token_index": 155
625
  },
626
  {
627
+ "cond_value": "brain gray matter",
628
  "token_index": 156
629
  },
630
  {
631
+ "cond_value": "brain white matter",
632
  "token_index": 157
633
  },
634
  {
635
+ "cond_value": "barrel cortex",
636
  "token_index": 158
637
  },
638
  {
639
+ "cond_value": "cerebellar hemisphere",
640
  "token_index": 159
641
  },
642
  {
643
+ "cond_value": "ileum",
644
  "token_index": 160
645
  },
646
  {
647
+ "cond_value": "acute myeloid leukemia",
648
  "token_index": 161
649
  },
650
  {
651
+ "cond_value": "acute promyelocytic leukemia",
652
  "token_index": 162
653
  },
654
  {
655
+ "cond_value": "chromophobe renal cell carcinoma",
656
  "token_index": 163
657
  },
658
  {
659
+ "cond_value": "adenocarcinoma",
660
  "token_index": 164
661
  },
662
  {
663
+ "cond_value": "neuroendocrine carcinoma",
664
  "token_index": 165
665
  },
666
  {
667
+ "cond_value": "wilms tumor",
668
  "token_index": 166
669
  },
670
  {
671
+ "cond_value": "pilocytic astrocytoma",
672
  "token_index": 167
673
  },
674
  {
675
+ "cond_value": "orbitofrontal cortex",
676
  "token_index": 168
677
  },
678
  {
679
+ "cond_value": "right occipital lobe",
680
  "token_index": 169
681
  },
682
  {
683
+ "cond_value": "dronc-seq",
684
  "token_index": 170
685
  },
686
  {
687
+ "cond_value": "mesonephros",
688
  "token_index": 171
689
  },
690
  {
691
+ "cond_value": "renal glomerulus",
692
  "token_index": 172
693
  },
694
  {
695
+ "cond_value": "outer medulla of kidney",
696
  "token_index": 173
697
  },
698
  {
699
+ "cond_value": "inner medulla of kidney",
700
  "token_index": 174
701
  },
702
  {
703
+ "cond_value": "superior frontal gyrus",
704
  "token_index": 175
705
  },
706
  {
707
+ "cond_value": "basal zone of heart",
708
  "token_index": 176
709
  }
710
  ]
models/sfm_config.json CHANGED
@@ -1,19 +1,18 @@
1
  {
2
  "sfm": {
3
  "embed_dim": 768,
4
- "expr_hidden_dim": 768,
5
- "expr_dropout": 0.1,
6
- "expr_value_scale": 1.0,
7
- "mod_hidden_dim": 768,
8
- "mod_dropout": 0.1,
 
9
  "cond_dropout": 0.1,
10
- "context_hidden_dim": 768,
11
- "context_dropout": 0.1,
12
- "embedding_dropout": 0.1,
13
  "freeze_loaded_gene_embeddings": false,
14
  "num_layers": 12,
15
  "num_heads": 12,
16
- "backbone_mlp_hidden_dim": 2048,
17
  "backbone_mlp_dropout": 0.02,
18
  "use_rotary": false,
19
  "qkv_bias": true,
@@ -25,7 +24,7 @@
25
  "num_factors": 256,
26
  "router_hidden_dim": 1024,
27
  "router_dropout": 0.1,
28
- "topk": 24,
29
  "router_temperature": 0.7,
30
  "beta_momentum": 0.1
31
  },
 
1
  {
2
  "sfm": {
3
  "embed_dim": 768,
4
+ "expr_num_bins": 32,
5
+ "expr_hidden_dim": 128,
6
+ "expr_tau": 1.0,
7
+ "batch_num_bins": 128,
8
+ "batch_hidden_dim": 128,
9
+ "batch_tau": 1.0,
10
  "cond_dropout": 0.1,
11
+ "out_dropout": 0.1,
 
 
12
  "freeze_loaded_gene_embeddings": false,
13
  "num_layers": 12,
14
  "num_heads": 12,
15
+ "backbone_mlp_hidden_dim": 3072,
16
  "backbone_mlp_dropout": 0.02,
17
  "use_rotary": false,
18
  "qkv_bias": true,
 
24
  "num_factors": 256,
25
  "router_hidden_dim": 1024,
26
  "router_dropout": 0.1,
27
+ "topk": 32,
28
  "router_temperature": 0.7,
29
  "beta_momentum": 0.1
30
  },
models/sfm_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:748070c393b74de89998967aa6fe79bfda4e98db43184072e23b86f29e0dcb81
3
- size 605872652
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e010e29145bbd3b2bce5aca9d188cfd5aa6aeae32dcfd5534ea65f67967c95c5
3
+ size 541486920