AngelPanizo's picture
Add BERTopic model
daed828 verified
{
"ctfidf_model": {
"bm25_weighting": false,
"reduce_frequent_words": true
},
"vectorizer_model": {
"params": {
"analyzer": "word",
"binary": false,
"decode_error": "strict",
"encoding": "utf-8",
"input": "content",
"lowercase": true,
"max_df": 0.8,
"max_features": null,
"min_df": 1,
"ngram_range": [
1,
1
],
"stop_words": [
"i",
"me",
"my",
"myself",
"we",
"our",
"ours",
"ourselves",
"you",
"you're",
"you've",
"you'll",
"you'd",
"your",
"yours",
"yourself",
"yourselves",
"he",
"him",
"his",
"himself",
"she",
"she's",
"her",
"hers",
"herself",
"it",
"it's",
"its",
"itself",
"they",
"them",
"their",
"theirs",
"themselves",
"what",
"which",
"who",
"whom",
"this",
"that",
"that'll",
"these",
"those",
"am",
"is",
"are",
"was",
"were",
"be",
"been",
"being",
"have",
"has",
"had",
"having",
"do",
"does",
"did",
"doing",
"a",
"an",
"the",
"and",
"but",
"if",
"or",
"because",
"as",
"until",
"while",
"of",
"at",
"by",
"for",
"with",
"about",
"against",
"between",
"into",
"through",
"during",
"before",
"after",
"above",
"below",
"to",
"from",
"up",
"down",
"in",
"out",
"on",
"off",
"over",
"under",
"again",
"further",
"then",
"once",
"here",
"there",
"when",
"where",
"why",
"how",
"all",
"any",
"both",
"each",
"few",
"more",
"most",
"other",
"some",
"such",
"no",
"nor",
"not",
"only",
"own",
"same",
"so",
"than",
"too",
"very",
"s",
"t",
"can",
"will",
"just",
"don",
"don't",
"should",
"should've",
"now",
"d",
"ll",
"m",
"o",
"re",
"ve",
"y",
"ain",
"aren",
"aren't",
"couldn",
"couldn't",
"didn",
"didn't",
"doesn",
"doesn't",
"hadn",
"hadn't",
"hasn",
"hasn't",
"haven",
"haven't",
"isn",
"isn't",
"ma",
"mightn",
"mightn't",
"mustn",
"mustn't",
"needn",
"needn't",
"shan",
"shan't",
"shouldn",
"shouldn't",
"wasn",
"wasn't",
"weren",
"weren't",
"won",
"won't",
"wouldn",
"wouldn't",
"worldwidewakeup"
],
"strip_accents": "unicode",
"token_pattern": "(?u)\\b\\w\\w+\\b",
"vocabulary": null
},
"vocab": {
"unvaccinated": 923,
"singles": 792,
"dating": 225,
"like": 498,
"minded": 563,
"adults": 36,
"started": 823,
"private": 679,
"facebook": 309,
"challenge": 153,
"finding": 327,
"someone": 805,
"align": 42,
"important": 441,
"decisions": 235,
"become": 87,
"apparent": 62,
"recently": 717,
"looking": 512,
"partner": 625,
"experiencing": 302,
"shedding": 775,
"symptoms": 862,
"relationships": 726,
"breaking": 119,
"parents": 622,
"agreeing": 39,
"vaccinate": 932,
"born": 116,
"cater": 149,
"wish": 971,
"find": 326,
"page": 619,
"regarding": 720,
"stance": 819,
"welcome": 964,
"invite": 455,
"single": 791,
"groups": 387,
"ussocial": 931,
"york": 993,
"please": 657,
"stop": 837,
"channels": 157,
"take": 864,
"back": 79,
"country": 202,
"people": 639,
"put": 698,
"power": 670,
"need": 581,
"know": 476,
"peoples": 640,
"voices": 943,
"matter": 543,
"mainstream": 519,
"news": 585,
"claiming": 169,
"hundreds": 433,
"stormed": 839,
"palace": 621,
"maybe": 544,
"go": 372,
"math": 541,
"class": 170,
"globalists": 370,
"great": 383,
"reset": 732,
"build": 126,
"better": 95,
"plan": 651,
"happen": 396,
"allow": 44,
"still": 834,
"calling": 137,
"conspiracy": 187,
"theorists": 882,
"wake": 946,
"millions": 562,
"protesting": 690,
"globally": 371,
"reason": 714,
"donkey": 257,
"arizona": 64,
"firefighters": 329,
"hoist": 418,
"large": 479,
"american": 52,
"flag": 334,
"convoy": 194,
"makes": 522,
"way": 956,
"let": 494,
"freedom": 346,
"dc": 230,
"yesterday": 991,
"23": 10,
"22": 9,
"participants": 624,
"california": 136,
"kick": 472,
"singing": 790,
"amazing": 51,
"grace": 380,
"unacceptable": 914,
"canadian": 140,
"government": 379,
"crossed": 215,
"line": 500,
"attacking": 71,
"peaceful": 636,
"protesters": 689,
"horses": 427,
"including": 443,
"elderly": 270,
"woman": 975,
"walker": 947,
"rumor": 743,
"one": 608,
"man": 523,
"killed": 474,
"trying": 906,
"confirm": 183,
"safe": 746,
"watching": 954,
"canberra": 141,
"million": 561,
"cars": 148,
"converged": 193,
"australia": 75,
"capital": 142,
"end": 280,
"covid": 207,
"regime": 723,
"cowboys": 209,
"showed": 781,
"alberta": 41,
"coutta": 206,
"border": 114,
"blockade": 105,
"hundred": 432,
"plus": 658,
"happening": 398,
"music": 576,
"said": 747,
"publicly": 694,
"play": 654,
"anywhere": 61,
"asking": 68,
"cards": 143,
"2022": 8,
"turned": 909,
"massive": 539,
"dance": 222,
"party": 627,
"ottawa": 614,
"night": 589,
"ready": 711,
"first": 330,
"street": 841,
"alongside": 47,
"quebec": 700,
"high": 412,
"school": 757,
"students": 845,
"stage": 818,
"protest": 688,
"mandatory": 528,
"mask": 537,
"chants": 158,
"breathe": 120,
"hearing": 406,
"sources": 809,
"truckers": 903,
"prepared": 675,
"hope": 425,
"outcomes": 615,
"heard": 405,
"questioning": 701,
"planned": 653,
"disrupt": 249,
"supply": 852,
"chain": 152,
"sure": 855,
"truth": 905,
"deserve": 244,
"give": 367,
"january": 463,
"29": 14,
"canada": 139,
"trucker": 902,
"arrived": 65,
"australian": 76,
"estimates": 290,
"least": 489,
"20": 5,
"000": 0,
"going": 376,
"heading": 401,
"city": 168,
"revolution": 735,
"spreading": 815,
"worldwide": 980,
"beautiful": 86,
"thing": 883,
"see": 763,
"largest": 480,
"nearly": 580,
"half": 392,
"trucks": 904,
"growing": 388,
"blocking": 106,
"boarders": 108,
"5million": 21,
"dollar": 255,
"raised": 706,
"support": 853,
"mandates": 527,
"move": 570,
"tyrannical": 912,
"withdraws": 972,
"building": 128,
"since": 789,
"weekend": 959,
"apparently": 63,
"already": 48,
"joining": 467,
"following": 336,
"announced": 55,
"thousands": 886,
"ca": 133,
"15": 2,
"mi": 558,
"10": 1,
"oh": 607,
"il": 437,
"tx": 911,
"ny": 598,
"wa": 944,
"fl": 333,
"must": 577,
"freedomconvoy2022": 347,
"taking": 866,
"action": 31,
"passports": 631,
"think": 885,
"deserves": 245,
"medal": 548,
"pages": 620,
"videos": 940,
"show": 780,
"70km": 25,
"long": 510,
"marching": 535,
"del": 238,
"bigtree": 98,
"highwire": 415,
"defeat": 237,
"march": 534,
"washington": 951,
"gather": 361,
"front": 348,
"lincoln": 499,
"memorial": 553,
"speakers": 812,
"rally": 707,
"bilbao": 99,
"spain": 810,
"mass": 538,
"demonstration": 241,
"nwo": 597,
"30": 16,
"message": 556,
"boris": 115,
"say": 752,
"stand": 820,
"nhs": 587,
"staff": 817,
"70": 24,
"unjabbed": 922,
"world": 979,
"wide": 968,
"london": 509,
"uk": 913,
"laying": 486,
"uniforms": 920,
"steps": 833,
"trafalgar": 900,
"square": 816,
"right": 737,
"deadline": 232,
"mandate": 525,
"draws": 262,
"closer": 172,
"demonstrations": 242,
"planet": 652,
"favor": 317,
"pre": 671,
"dinner": 246,
"getting": 365,
"excited": 296,
"santiago": 750,
"chile": 163,
"institution": 451,
"stronghold": 843,
"corporation": 197,
"carrying": 147,
"sinovac": 793,
"bioweapon": 101,
"studies": 846,
"kids": 473,
"dying": 263,
"serious": 772,
"health": 403,
"problems": 680,
"ormeau": 612,
"qld": 699,
"small": 800,
"cafe": 134,
"targeted": 867,
"recent": 716,
"days": 229,
"officers": 604,
"alleged": 43,
"passport": 630,
"breaches": 118,
"gets": 364,
"surrounded": 857,
"protected": 687,
"seattle": 761,
"fire": 328,
"police": 662,
"discharged": 248,
"noncompliance": 591,
"watch": 952,
"turn": 908,
"boots": 113,
"hall": 393,
"subscribe": 847,
"italy": 460,
"october": 601,
"19": 4,
"2021": 7,
"bring": 124,
"food": 337,
"port": 665,
"genoa": 362,
"day": 227,
"fury": 353,
"melbourne": 551,
"chaos": 159,
"construction": 189,
"industry": 447,
"says": 754,
"jab": 462,
"angry": 54,
"attempted": 72,
"shutdown": 782,
"highway": 414,
"struggled": 844,
"get": 363,
"grip": 386,
"using": 930,
"rubber": 742,
"bullets": 129,
"tear": 869,
"gas": 359,
"belong": 90,
"religion": 728,
"god": 374,
"given": 368,
"manipulation": 532,
"sin": 788,
"manipulations": 533,
"always": 50,
"used": 929,
"profits": 682,
"constructers": 188,
"owners": 617,
"suppress": 854,
"far": 314,
"majority": 520,
"also": 49,
"human": 430,
"elite": 272,
"decide": 234,
"others": 613,
"best": 93,
"creator": 212,
"replace": 729,
"function": 352,
"manipulate": 531,
"creation": 211,
"worst": 983,
"possible": 667,
"sabmyk": 745,
"state": 825,
"premier": 672,
"dan": 221,
"andrews": 53,
"condemned": 182,
"terrible": 877,
"behavior": 88,
"west": 966,
"bridge": 122,
"gate": 360,
"manic": 530,
"scenes": 756,
"suspended": 858,
"two": 910,
"weeks": 961,
"workers": 978,
"fight": 320,
"vaccines": 934,
"theeuropenews": 881,
"grassroots": 381,
"information": 448,
"activists": 32,
"come": 173,
"rain": 705,
"shine": 776,
"fighting": 321,
"pass": 628,
"nice": 588,
"france": 345,
"enter": 288,
"train": 901,
"station": 826,
"occupy": 599,
"tracks": 899,
"second": 762,
"weekly": 960,
"sidewalk": 784,
"picnic": 648,
"held": 408,
"calgary": 135,
"chinada": 164,
"perfect": 641,
"song": 807,
"thanks": 880,
"band": 82,
"pesky": 647,
"2nd": 15,
"undocumented": 917,
"citizens": 167,
"enjoyed": 286,
"liberty": 495,
"sandwiches": 749,
"together": 894,
"meanwhile": 546,
"fully": 351,
"documented": 254,
"seemed": 764,
"deserted": 243,
"purveyors": 697,
"oct": 600,
"university": 921,
"make": 521,
"passionate": 629,
"plea": 656,
"illegal": 438,
"enforced": 284,
"baffled": 81,
"believes": 89,
"hoax": 417,
"worse": 982,
"yet": 992,
"wants": 950,
"enforce": 283,
"experimental": 303,
"perfectly": 642,
"healthy": 404,
"youth": 995,
"listen": 502,
"hands": 395,
"deck": 236,
"another": 56,
"zealand": 996,
"finally": 325,
"communist": 176,
"controlled": 192,
"starting": 824,
"rise": 738,
"brilliant": 123,
"green": 384,
"young": 994,
"brave": 117,
"stood": 836,
"job": 465,
"well": 965,
"done": 256,
"next": 586,
"week": 958,
"lives": 505,
"vaxxed": 935,
"unvaxxed": 924,
"order": 610,
"straighten": 840,
"mess": 555,
"humanity": 431,
"threat": 887,
"set": 773,
"former": 342,
"aussie": 74,
"airline": 40,
"pilot": 649,
"refused": 719,
"mandated": 526,
"tells": 875,
"politicians": 663,
"swiss": 861,
"bern": 92,
"crowds": 216,
"storm": 838,
"main": 518,
"railway": 704,
"thursday": 890,
"marked": 536,
"fourth": 344,
"consecutive": 186,
"evening": 292,
"protests": 691,
"forces": 340,
"vaccination": 933,
"status": 827,
"permitted": 644,
"restaurants": 733,
"bars": 84,
"public": 693,
"venues": 936,
"looming": 513,
"atrocity": 69,
"really": 713,
"stock": 835,
"things": 884,
"care": 144,
"danny": 223,
"rampling": 708,
"sept": 771,
"25th": 12,
"interviews": 454,
"unwashed2020": 925,
"revolutie": 734,
"italie": 459,
"35": 17,
"blokkeren": 107,
"de": 231,
"snelwegen": 802,
"inmiddels": 449,
"hebben": 407,
"boeren": 109,
"zich": 997,
"aangesloten": 27,
"en": 279,
"lokale": 508,
"wegen": 963,
"kacunas": 469,
"globalism": 369,
"biggest": 97,
"slovenia": 799,
"demonstrate": 240,
"block": 104,
"roads": 739,
"ljubljana": 507,
"work": 977,
"access": 29,
"shopping": 778,
"center": 151,
"demanding": 239,
"early": 264,
"elections": 271,
"saturday": 751,
"reported": 731,
"adelaide": 34,
"came": 138,
"force": 339,
"enough": 287,
"fake": 310,
"msm": 573,
"channel": 156,
"chat": 161,
"five": 332,
"report": 730,
"nurses": 596,
"courage": 204,
"currently": 219,
"silent": 786,
"whilst": 967,
"social": 803,
"distancing": 250,
"idea": 435,
"even": 291,
"chopper": 166,
"good": 378,
"ya": 987,
"strong": 842,
"anti": 58,
"istanbul": 458,
"slaves": 797,
"speaker": 811,
"copied": 195,
"pasted": 632,
"karen": 470,
"brewers": 121,
"victoria": 938,
"edinborough": 269,
"gardens": 358,
"fitzroy": 331,
"teachers": 868,
"silently": 787,
"standing": 821,
"holding": 419,
"hey": 410,
"guys": 390,
"viewing": 942,
"ends": 281,
"tonight": 896,
"midnight": 559,
"miss": 564,
"late": 482,
"officially": 605,
"last": 481,
"movie": 571,
"read": 710,
"note": 592,
"attached": 70,
"explain": 305,
"unfortunately": 919,
"telegram": 872,
"allows": 45,
"much": 574,
"text": 878,
"post": 668,
"regards": 722,
"healing": 402,
"made": 517,
"fyi": 355,
"available": 77,
"price": 677,
"bump": 130,
"full": 350,
"left": 492,
"real": 712,
"anthony": 57,
"fauci": 316,
"modules": 566,
"sale": 748,
"scroll": 759,
"movies": 572,
"click": 171,
"package": 618,
"image": 439,
"love": 515,
"jm": 464,
"admin": 35,
"use": 928,
"want": 948,
"highlight": 413,
"something": 806,
"followers": 335,
"specifically": 813,
"mentioned": 554,
"yay": 988,
"interested": 452,
"producers": 681,
"hard": 400,
"copies": 196,
"film": 324,
"includes": 442,
"reference": 718,
"wanted": 949,
"point": 660,
"tomorrow": 895,
"goes": 375,
"might": 560,
"along": 46,
"purchase": 696,
"learn": 488,
"part": 623,
"share": 774,
"live": 504,
"sneak": 801,
"peek": 637,
"parts": 626,
"27th": 13,
"hurry": 434,
"separate": 770,
"video": 939,
"players": 655,
"screen": 758,
"able": 28,
"view": 941,
"sign": 785,
"rfk": 736,
"jr": 468,
"feature": 318,
"length": 493,
"popcorn": 664,
"enjoy": 285,
"window": 970,
"watched": 953,
"chance": 154,
"expose": 306,
"maniacs": 529,
"hi": 411,
"website": 957,
"update": 926,
"slept": 798,
"exhausted": 299,
"managed": 524,
"figure": 322,
"issue": 457,
"covidvaccinevictims": 208,
"mistake": 565,
"changed": 155,
"dns": 251,
"forwarding": 343,
"backend": 80,
"caused": 150,
"ip": 456,
"address": 33,
"match": 540,
"needed": 582,
"properly": 686,
"bit": 103,
"technical": 871,
"builder": 127,
"figured": 323,
"needs": 583,
"propagate": 685,
"running": 744,
"correctly": 198,
"hopefully": 426,
"soon": 808,
"within": 973,
"24": 11,
"hours": 428,
"patience": 633,
"receive": 715,
"couple": 203,
"nasty": 578,
"emails": 275,
"complaining": 180,
"nothing": 593,
"concern": 181,
"takes": 865,
"lot": 514,
"time": 891,
"money": 567,
"emotions": 277,
"energy": 282,
"understanding": 916,
"patient": 634,
"thank": 879,
"staying": 829,
"meantime": 545,
"teaser": 870,
"updating": 927,
"exciting": 297,
"documentary": 253,
"robert": 740,
"kennedy": 471,
"based": 85,
"times": 892,
"bestselling": 94,
"book": 111,
"releases": 727,
"tuesday": 907,
"regardless": 721,
"forget": 341,
"family": 312,
"media": 549,
"murder": 575,
"countdown": 201,
"gain": 356,
"incredible": 445,
"8p": 26,
"est": 289,
"5pm": 22,
"pst": 692,
"posting": 669,
"premiere": 673,
"date": 224,
"short": 779,
"period": 643,
"notified": 595,
"personally": 646,
"send": 768,
"everyone": 294,
"else": 273,
"sees": 765,
"happy": 399,
"offer": 602,
"asked": 67,
"month": 568,
"ago": 38,
"promoting": 684,
"spellbinding": 814,
"selling": 767,
"honor": 424,
"big": 96,
"feel": 319,
"exposing": 307,
"little": 503,
"rat": 709,
"top": 897,
"list": 501,
"often": 606,
"daydream": 228,
"sitting": 794,
"interview": 453,
"telling": 874,
"choice": 165,
"words": 976,
"memes": 552,
"sunglasses": 851,
"fall": 311,
"person": 645,
"face": 308,
"thug": 889,
"scrolls": 760,
"across": 30,
"yeah": 989,
"goal": 373,
"haha": 391,
"sunday": 850,
"pm": 659,
"sending": 769,
"notification": 594,
"via": 937,
"email": 274,
"register": 724,
"guy": 389,
"sick": 783,
"ow": 616,
"banned": 83,
"curtesy": 220,
"bio": 100,
"six": 795,
"connected": 184,
"coming": 174,
"related": 725,
"crisis": 214,
"three": 888,
"years": 990,
"bonus": 110,
"surprise": 856,
"wait": 945,
"tell": 873,
"indoctrination": 446,
"article": 66,
"prepare": 674,
"temporary": 876,
"quick": 702,
"6000": 23,
"worth": 984,
"downloadable": 260,
"printable": 678,
"books": 112,
"courses": 205,
"50": 20,
"deal": 233,
"gimmicks": 366,
"help": 409,
"community": 178,
"check": 162,
"never": 584,
"anything": 60,
"iike": 436,
"lifetime": 497,
"worry": 981,
"future": 354,
"wef": 962,
"eat": 266,
"bugs": 125,
"meat": 547,
"everything": 295,
"unfolding": 918,
"2020": 6,
"would": 985,
"ever": 293,
"bundle": 131,
"start": 822,
"self": 766,
"sufficient": 849,
"stay": 828,
"grateful": 382,
"happened": 397,
"connections": 185,
"knowing": 477,
"ivermectin": 461,
"loved": 516,
"could": 200,
"contact": 190,
"easily": 265,
"meet": 550,
"gone": 377,
"eating": 267,
"crickets": 213,
"skills": 796,
"communities": 177,
"leave": 490,
"matrix": 542,
"www": 986,
"holisticwildandfree": 420,
"offgrid": 603,
"empowering": 278,
"farming": 315,
"documentaries": 252,
"attention": 73,
"posing": 666,
"messages": 557,
"anyone": 59,
"exclusively": 298,
"careful": 145,
"scammers": 755,
"sufficiency": 848,
"exodus": 300,
"system": 863,
"crumble": 217,
"knees": 475,
"leaving": 491,
"imagine": 440,
"saying": 753,
"fu": 349,
"water": 955,
"dirty": 247,
"poisonous": 661,
"solar": 804,
"instead": 450,
"paying": 635,
"corrupt": 199,
"companies": 179,
"step": 831,
"created": 210,
"library": 496,
"download": 259,
"47": 19,
"leading": 487,
"experts": 304,
"uncertain": 915,
"nature": 579,
"grid": 385,
"quit": 703,
"sustainably": 860,
"organic": 611,
"online": 609,
"income": 444,
"nomad": 590,
"living": 506,
"tiny": 893,
"homes": 422,
"sustainable": 859,
"crypto": 218,
"emf": 276,
"prepping": 676,
"homeschooling": 423,
"home": 421,
"birthing": 102,
"common": 175,
"law": 485,
"buy": 132,
"longer": 511,
"launched": 483,
"gardening": 357,
"stead": 830,
"foraging": 338,
"affect": 37,
"content": 191,
"place": 650,
"shit": 777,
"hits": 416,
"fan": 313,
"launches": 484,
"40": 18,
"ebooks": 268,
"18th": 3,
"pulling": 695,
"totally": 898,
"project": 683,
"david": 226,
"avocado": 78,
"wolfe": 974,
"john": 466,
"hancock": 394,
"peggy": 638,
"charles": 160,
"dowding": 258,
"carly": 146,
"rose": 741,
"bergman": 91,
"dr": 261,
"stephen": 832,
"house": 429,
"expedition": 301,
"kombi": 478,
"wild": 969,
"mothering": 569
}
}
}