BERTopic_model / ctfidf_config.json
wizardofchance's picture
Add BERTopic model
ccd8637 verified
{
"ctfidf_model": {
"bm25_weighting": false,
"reduce_frequent_words": false
},
"vectorizer_model": {
"params": {
"analyzer": "word",
"binary": false,
"decode_error": "strict",
"encoding": "utf-8",
"input": "content",
"lowercase": true,
"max_df": 1.0,
"max_features": null,
"min_df": 1,
"ngram_range": [
1,
1
],
"stop_words": "english",
"strip_accents": null,
"token_pattern": "(?u)\\b\\w\\w+\\b",
"vocabulary": null
},
"vocab": {
"turning": 1045,
"practical": 748,
"aspect": 75,
"question": 808,
"proposal": 785,
"prime": 766,
"minister": 620,
"india": 497,
"shri": 932,
"rajiv": 814,
"gandhi": 423,
"ninth": 658,
"summit": 984,
"conference": 208,
"non": 660,
"aligned": 51,
"countries": 245,
"held": 458,
"belgrade": 109,
"september": 919,
"creation": 250,
"planet": 725,
"protection": 792,
"fund": 419,
"ppf": 747,
"received": 823,
"wide": 1109,
"attention": 92,
"support": 986,
"particularly": 704,
"encouraged": 343,
"extended": 371,
"president": 757,
"vassiliou": 1082,
"cyprus": 258,
"brundtland": 129,
"norway": 662,
"envisages": 355,
"developing": 288,
"developed": 287,
"contribute": 233,
"used": 1078,
"protect": 790,
"environment": 353,
"purchasing": 799,
"conservation": 217,
"compatible": 188,
"technologies": 1003,
"critical": 253,
"areas": 68,
"brought": 128,
"public": 797,
"domain": 316,
"benefit": 110,
"view": 1088,
"sine": 940,
"qua": 805,
"arriving": 73,
"global": 434,
"compact": 187,
"combating": 178,
"environmental": 354,
"degradation": 269,
"hope": 466,
"general": 426,
"assembly": 78,
"able": 16,
"lend": 565,
"delegation": 270,
"warmly": 1099,
"welcomes": 1106,
"assumption": 83,
"ambassador": 53,
"garba": 424,
"stewardship": 967,
"fourth": 406,
"session": 924,
"eminent": 341,
"personality": 722,
"distinguished": 310,
"representative": 866,
"country": 246,
"friendliest": 415,
"relations": 851,
"confident": 210,
"known": 547,
"diplomatic": 298,
"skill": 942,
"experience": 369,
"deliberations": 271,
"fruitful": 416,
"purposive": 802,
"admire": 31,
"sure": 989,
"touch": 1023,
"assurance": 84,
"promptness": 783,
"secretary": 909,
"mr": 632,
"perez": 719,
"cuellar": 255,
"discharging": 303,
"onerous": 674,
"aid": 47,
"growing": 443,
"responsibilities": 880,
"entrusted": 352,
"united": 1065,
"nations": 644,
"displayed": 309,
"quiet": 809,
"competence": 189,
"remarkable": 859,
"insight": 511,
"organization": 688,
"great": 437,
"potentialities": 743,
"limitations": 577,
"referred": 835,
"report": 864,
"renewal": 862,
"confidence": 209,
"multilateralism": 634,
"44": 13,
"today": 1019,
"longer": 585,
"ideal": 472,
"necessity": 646,
"ultimate": 1046,
"validity": 1080,
"driven": 320,
"home": 465,
"threat": 1015,
"posed": 739,
"human": 471,
"survival": 991,
"nuclear": 666,
"arms": 70,
"race": 810,
"military": 618,
"threats": 1017,
"security": 912,
"poverty": 744,
"underdevelopment": 1050,
"population": 738,
"inequality": 504,
"linchpin": 578,
"strengthened": 971,
"scope": 906,
"universal": 1067,
"membership": 610,
"mandated": 599,
"treaty": 1034,
"form": 400,
"chatter": 161,
"renewed": 863,
"major": 593,
"powers": 746,
"partial": 702,
"selective": 914,
"total": 1021,
"embracing": 337,
"unfortunate": 1059,
"assert": 79,
"rightful": 894,
"role": 896,
"political": 735,
"field": 384,
"regarded": 839,
"economic": 325,
"appropriate": 64,
"forum": 403,
"negotiations": 654,
"issues": 538,
"sincerely": 939,
"hopes": 467,
"imbalance": 476,
"soon": 946,
"redressed": 833,
"ongoing": 675,
"process": 776,
"formulation": 401,
"international": 526,
"development": 289,
"strategy": 970,
"1990s": 9,
"forthcoming": 402,
"special": 952,
"devoted": 292,
"operation": 678,
"provide": 794,
"excellent": 361,
"opportunity": 682,
"concerned": 197,
"blood": 117,
"bath": 105,
"afghanistan": 37,
"continued": 230,
"soviet": 950,
"union": 1064,
"completed": 190,
"withdrawal": 1115,
"troops": 1037,
"schedule": 903,
"parties": 705,
"observe": 669,
"strictly": 974,
"implement": 481,
"geneva": 428,
"accords": 18,
"letter": 568,
"spirit": 955,
"futile": 421,
"search": 908,
"solution": 944,
"come": 179,
"negotiating": 652,
"table": 993,
"trying": 1043,
"resolve": 873,
"means": 606,
"ate": 87,
"prolonging": 781,
"agony": 44,
"people": 717,
"najibullah": 637,
"recently": 825,
"series": 920,
"far": 380,
"reaching": 819,
"proposals": 786,
"national": 643,
"reconciliation": 830,
"opinion": 680,
"deserve": 277,
"consideration": 218,
"maintained": 592,
"traditionally": 1026,
"close": 170,
"iran": 533,
"iraq": 534,
"dismayed": 308,
"lack": 550,
"progress": 779,
"translating": 1031,
"cease": 148,
"agreed": 45,
"year": 1120,
"durable": 323,
"peace": 713,
"supports": 988,
"efforts": 329,
"secure": 911,
"implementation": 482,
"council": 244,
"resolution": 872,
"598": 15,
"1987": 6,
"help": 459,
"vexatious": 1085,
"optimistic": 686,
"note": 664,
"struck": 977,
"regarding": 840,
"prospects": 789,
"resolving": 875,
"long": 584,
"standing": 960,
"problem": 774,
"basis": 104,
"sovereignty": 949,
"unity": 1066,
"territorial": 1011,
"integrity": 519,
"urge": 1073,
"redouble": 832,
"advantage": 33,
"present": 754,
"propitious": 784,
"climate": 168,
"korean": 549,
"peninsula": 716,
"unhappily": 1061,
"remains": 858,
"divided": 313,
"overwhelming": 695,
"sentiment": 918,
"favour": 381,
"dialogue": 293,
"aimed": 50,
"peaceful": 714,
"reunification": 889,
"korea": 548,
"conformity": 212,
"principle": 768,
"universality": 1068,
"aspirations": 77,
"actively": 24,
"realization": 822,
"purposes": 801,
"principles": 769,
"representation": 865,
"world": 1119,
"body": 118,
"recent": 824,
"breakthrough": 124,
"crucial": 254,
"aspects": 76,
"framework": 409,
"strategic": 969,
"reduction": 834,
"talks": 998,
"start": 961,
"welcome": 1105,
"relief": 854,
"brightened": 125,
"early": 324,
"conclusion": 201,
"essential": 359,
"agreement": 46,
"clinched": 169,
"loss": 587,
"momentum": 623,
"meantime": 607,
"moves": 630,
"apace": 59,
"sign": 934,
"let": 567,
"weapons": 1103,
"testing": 1014,
"goes": 435,
"unchecked": 1048,
"does": 315,
"new": 657,
"systems": 992,
"modernization": 622,
"existing": 366,
"weapon": 1102,
"particle": 703,
"beams": 106,
"stealth": 966,
"bombers": 120,
"smart": 943,
"missiles": 621,
"hardly": 451,
"going": 436,
"inspire": 512,
"large": 553,
"interlocutors": 524,
"developments": 291,
"tend": 1006,
"confirm": 211,
"basic": 103,
"apprehensions": 62,
"qualitative": 806,
"clearly": 167,
"monitoring": 624,
"scientific": 905,
"technological": 1002,
"bearing": 107,
"considerations": 219,
"disarmament": 301,
"presented": 755,
"action": 22,
"plan": 724,
"elimination": 336,
"2010": 11,
"states": 964,
"initiate": 506,
"necessary": 645,
"multilateral": 633,
"overall": 694,
"aim": 49,
"moving": 631,
"free": 411,
"violent": 1092,
"past": 708,
"years": 1121,
"community": 186,
"pressing": 759,
"comprehensive": 194,
"chemical": 162,
"convention": 236,
"reached": 818,
"statements": 963,
"week": 1104,
"bush": 132,
"foreign": 398,
"shevardnadze": 931,
"doubt": 317,
"facilitate": 374,
"outstanding": 693,
"resolved": 874,
"signed": 935,
"1990": 8,
"witnessed": 1116,
"cancerous": 140,
"growth": 444,
"terrorism": 1012,
"levels": 570,
"measures": 608,
"discourage": 304,
"terrorist": 1013,
"acts": 25,
"taking": 997,
"innocent": 509,
"men": 611,
"women": 1117,
"hostages": 469,
"awareness": 96,
"menace": 612,
"translated": 1030,
"concrete": 202,
"actions": 23,
"curb": 256,
"like": 576,
"pay": 711,
"tribute": 1036,
"friend": 414,
"dante": 260,
"caputo": 142,
"leadership": 559,
"provided": 795,
"1989": 7,
"consolidation": 220,
"enhanced": 348,
"affairs": 35,
"keeping": 546,
"observation": 668,
"teams": 1001,
"troubled": 1038,
"regions": 847,
"creditably": 252,
"functions": 418,
"contribution": 234,
"recognized": 828,
"merited": 614,
"award": 95,
"nobel": 659,
"prize": 773,
"forces": 396,
"closed": 171,
"optimism": 685,
"palestinian": 700,
"bold": 119,
"courageous": 247,
"initiative": 508,
"arafat": 66,
"initiation": 507,
"palestine": 699,
"liberation": 572,
"created": 249,
"positive": 740,
"situation": 941,
"deadlocked": 263,
"intifadah": 529,
"unarmed": 1047,
"struggle": 979,
"continues": 231,
"amidst": 56,
"increasing": 492,
"repression": 868,
"west": 1107,
"asia": 74,
"just": 545,
"settlement": 926,
"based": 102,
"inalienable": 487,
"right": 893,
"self": 915,
"determination": 283,
"recognition": 826,
"rights": 895,
"region": 843,
"including": 489,
"israel": 537,
"live": 582,
"internationally": 527,
"borders": 121,
"convinced": 238,
"purpose": 800,
"sponsored": 957,
"needs": 649,
"convened": 235,
"urgently": 1075,
"civil": 164,
"strife": 975,
"lebanon": 562,
"fractured": 407,
"constitutional": 224,
"success": 981,
"latest": 556,
"effort": 328,
"high": 462,
"level": 569,
"committee": 183,
"arab": 65,
"league": 561,
"bringing": 127,
"glimmer": 433,
"horizon": 468,
"current": 257,
"lead": 557,
"stability": 958,
"return": 888,
"months": 626,
"ago": 43,
"paris": 701,
"raised": 813,
"future": 422,
"cambodia": 136,
"significant": 936,
"elements": 334,
"package": 697,
"differences": 294,
"persisted": 721,
"cambodian": 137,
"factions": 376,
"resulting": 887,
"aiding": 48,
"making": 596,
"completion": 191,
"vietnamese": 1087,
"adapt": 26,
"balanced": 100,
"approach": 63,
"takes": 996,
"account": 19,
"reality": 821,
"prevailing": 762,
"interests": 522,
"provides": 796,
"cessation": 154,
"interference": 523,
"intervention": 528,
"internal": 525,
"exercise": 364,
"determine": 284,
"destiny": 282,
"equally": 357,
"important": 485,
"ensure": 350,
"costs": 243,
"prevented": 764,
"victim": 1086,
"universally": 1069,
"condemned": 203,
"genocidal": 429,
"policies": 734,
"practices": 750,
"pol": 733,
"pot": 742,
"regime": 841,
"danger": 259,
"recurrence": 831,
"fighting": 386,
"signs": 938,
"visible": 1094,
"arrested": 72,
"imperative": 480,
"need": 647,
"supplies": 985,
"meaningful": 605,
"achieving": 21,
"proliferation": 780,
"true": 1039,
"sense": 917,
"term": 1009,
"unless": 1071,
"doctrines": 314,
"deterrence": 286,
"underpin": 1053,
"discarded": 302,
"root": 897,
"dithering": 312,
"prospect": 788,
"real": 820,
"release": 852,
"resources": 876,
"sector": 910,
"utilized": 1079,
"involved": 531,
"bring": 126,
"economy": 327,
"conscious": 214,
"pert": 723,
"needed": 648,
"institutional": 513,
"arrangements": 71,
"giving": 432,
"shape": 929,
"link": 580,
"opportunities": 681,
"harnessed": 452,
"direction": 299,
"speak": 951,
"capacity": 141,
"mind": 619,
"inevitably": 505,
"date": 261,
"month": 625,
"14": 1,
"november": 665,
"day": 262,
"100": 0,
"1889": 2,
"indian": 498,
"born": 122,
"jawaharlal": 540,
"nehru": 655,
"riches": 892,
"sacrificed": 900,
"join": 542,
"freedom": 412,
"1947": 3,
"mantle": 601,
"leading": 560,
"independent": 496,
"fell": 383,
"having": 455,
"atrocities": 89,
"indignities": 499,
"heaped": 456,
"man": 597,
"imbibed": 478,
"lesson": 566,
"truth": 1041,
"violence": 1091,
"mentor": 613,
"mahatma": 590,
"emerged": 338,
"vision": 1095,
"different": 295,
"conventional": 237,
"wisdom": 1112,
"spoke": 956,
"moral": 628,
"force": 395,
"alignment": 52,
"bloc": 116,
"politics": 736,
"pulled": 798,
"asunder": 85,
"beginning": 108,
"lone": 583,
"voice": 1097,
"association": 82,
"tito": 1018,
"nasser": 642,
"leaders": 558,
"led": 563,
"birth": 115,
"movement": 629,
"vast": 1083,
"majority": 594,
"members": 609,
"outside": 692,
"recognize": 827,
"seek": 913,
"associate": 81,
"age": 40,
"old": 673,
"message": 615,
"precious": 751,
"heritage": 460,
"civilizations": 165,
"rescinded": 870,
"nan": 640,
"happened": 448,
"coincide": 174,
"centenary": 150,
"conclude": 200,
"gave": 425,
"33": 12,
"said": 902,
"peoples": 718,
"passionately": 707,
"desirous": 280,
"desire": 278,
"war": 1098,
"certainly": 153,
"common": 185,
"desires": 279,
"follow": 393,
"path": 709,
"away": 97,
"fears": 382,
"hatred": 453,
"happy": 449,
"central": 151,
"america": 54,
"called": 134,
"play": 729,
"american": 55,
"directly": 300,
"problems": 775,
"besetting": 112,
"compliments": 193,
"statesmanship": 965,
"foresight": 399,
"wish": 1113,
"implementing": 483,
"esquipulas": 358,
"tela": 1005,
"collective": 176,
"bid": 114,
"restore": 882,
"revitalize": 890,
"north": 661,
"south": 947,
"mutuality": 635,
"presidents": 758,
"egypt": 330,
"venezuela": 1084,
"senegal": 916,
"took": 1020,
"july": 544,
"commencement": 180,
"consultations": 226,
"industrialized": 502,
"france": 410,
"canada": 138,
"responded": 878,
"positively": 741,
"response": 879,
"reliance": 853,
"constitutes": 222,
"principal": 767,
"plank": 726,
"platform": 728,
"arid": 69,
"unfortunately": 1060,
"lagged": 552,
"expectations": 368,
"determined": 285,
"backed": 98,
"highest": 464,
"required": 869,
"look": 586,
"forward": 405,
"recommendations": 829,
"commission": 182,
"subject": 980,
"surged": 990,
"forefront": 397,
"concern": 196,
"items": 539,
"agenda": 41,
"end": 345,
"prepare": 753,
"proposed": 787,
"1992": 10,
"strongly": 976,
"solving": 945,
"closely": 172,
"related": 850,
"viewed": 1089,
"isolation": 536,
"stockholm": 968,
"1972": 4,
"shrineti": 933,
"indira": 500,
"characterizing": 159,
"greatest": 439,
"pollutant": 737,
"area": 67,
"consensus": 215,
"unifying": 1062,
"remain": 856,
"happen": 447,
"legitimate": 564,
"concerns": 198,
"addressed": 28,
"adequately": 29,
"endeavour": 346,
"tackle": 994,
"deal": 264,
"attempt": 91,
"freeze": 413,
"unequal": 1056,
"predicament": 752,
"responsibility": 881,
"corrective": 242,
"apart": 60,
"fact": 375,
"wherewithal": 1108,
"financial": 389,
"tendency": 1007,
"rely": 855,
"regulatory": 849,
"fully": 417,
"asymmetries": 86,
"industrialization": 501,
"point": 730,
"supportive": 987,
"enable": 342,
"compromising": 195,
"priorities": 770,
"greater": 438,
"importance": 484,
"generation": 427,
"cope": 239,
"rapid": 815,
"changes": 157,
"pattern": 710,
"production": 778,
"consumption": 227,
"trade": 1024,
"revolution": 891,
"integrationist": 518,
"trends": 1035,
"optimising": 684,
"benefits": 111,
"evolve": 360,
"rules": 899,
"regulations": 848,
"regimes": 842,
"fields": 385,
"manufactures": 602,
"services": 922,
"science": 904,
"technology": 1004,
"uruguay": 1077,
"round": 898,
"address": 27,
"distortions": 311,
"trading": 1025,
"preserving": 756,
"strengthening": 972,
"emerging": 340,
"imbalances": 477,
"inadequate": 486,
"priority": 771,
"given": 431,
"pressures": 760,
"undertake": 1054,
"obligations": 667,
"developmental": 290,
"taken": 995,
"removal": 860,
"barriers": 101,
"transfer": 1028,
"restrictive": 885,
"business": 133,
"followed": 394,
"transnational": 1032,
"corporations": 241,
"specific": 953,
"promotion": 782,
"service": 921,
"industries": 503,
"partners": 706,
"adopt": 32,
"unilateral": 1063,
"coercive": 173,
"penetrate": 715,
"markets": 603,
"liberalization": 571,
"unjust": 1070,
"irrational": 535,
"conducive": 206,
"ma": 589,
"jot": 543,
"undertaking": 1055,
"centres": 152,
"power": 745,
"focal": 392,
"points": 732,
"regional": 844,
"integration": 517,
"regionalism": 845,
"vivisection": 1096,
"answers": 57,
"complex": 192,
"lie": 573,
"narrow": 641,
"havens": 454,
"regionally": 846,
"integrated": 516,
"larger": 554,
"harbour": 450,
"truly": 1040,
"exchanges": 362,
"interactions": 521,
"drug": 321,
"abuse": 17,
"illicit": 475,
"trafficking": 1027,
"drugs": 322,
"scourge": 907,
"corn": 240,
"try": 1042,
"immune": 479,
"consequently": 216,
"entire": 351,
"operate": 677,
"urgent": 1074,
"task": 1000,
"connection": 213,
"colombia": 177,
"calling": 135,
"lies": 574,
"namibian": 639,
"awaited": 94,
"independence": 495,
"undergone": 1052,
"suffering": 982,
"heroic": 461,
"sacrifices": 901,
"way": 1101,
"transition": 1029,
"assistance": 80,
"group": 441,
"guidance": 445,
"creditable": 251,
"job": 541,
"conditions": 205,
"strewn": 973,
"obstacles": 670,
"conduct": 207,
"fair": 378,
"elections": 333,
"vigilance": 1090,
"caution": 147,
"exercised": 365,
"lacunae": 551,
"election": 332,
"identified": 473,
"speedily": 954,
"removed": 861,
"constituent": 221,
"sovereign": 948,
"unfettered": 1058,
"frame": 408,
"constitution": 223,
"set": 925,
"outcome": 690,
"reflects": 836,
"wishes": 1114,
"namibia": 638,
"signify": 937,
"african": 39,
"illegal": 474,
"occupation": 671,
"citadel": 163,
"apartheid": 61,
"africa": 38,
"intact": 515,
"claims": 166,
"matte": 604,
"racial": 811,
"atmosphere": 88,
"undergoing": 1051,
"change": 156,
"watching": 1100,
"carefully": 143,
"quality": 807,
"extent": 372,
"pace": 696,
"willing": 1110,
"reformed": 837,
"totally": 1022,
"dismantled": 307,
"half": 446,
"house": 470,
"restoring": 883,
"dignity": 297,
"protecting": 791,
"demonstrate": 274,
"willingness": 1111,
"negotiate": 650,
"unconditionally": 1049,
"genuine": 430,
"representatives": 867,
"order": 687,
"create": 248,
"suitable": 983,
"negotiation": 653,
"nelson": 656,
"mandela": 600,
"prisoners": 772,
"lift": 575,
"restrictions": 884,
"organizations": 689,
"state": 962,
"emergency": 339,
"line": 579,
"intimidation": 530,
"equality": 356,
"enshrined": 349,
"charter": 160,
"oppose": 683,
"discrimination": 305,
"practiced": 749,
"fiji": 387,
"institutionalise": 514,
"continuing": 232,
"resistance": 871,
"inquiry": 510,
"advisory": 34,
"little": 581,
"eliminate": 335,
"racially": 812,
"discriminatory": 306,
"character": 158,
"draft": 318,
"zealand": 1122,
"pointed": 731,
"failed": 377,
"departure": 276,
"fundamental": 420,
"democratic": 273,
"better": 113,
"prevail": 761,
"late": 555,
"myanmar": 636,
"unstable": 1072,
"result": 886,
"burmese": 131,
"authorities": 93,
"respond": 877,
"urging": 1076,
"democracy": 272,
"work": 1118,
"tensions": 1008,
"met": 616,
"encouraging": 344,
"expansion": 367,
"output": 691,
"external": 373,
"unfavourable": 1057,
"official": 672,
"stagnating": 959,
"terms": 1010,
"target": 999,
"cent": 149,
"gross": 440,
"product": 777,
"flows": 391,
"commercial": 181,
"virtually": 1093,
"dried": 319,
"1980s": 5,
"commodity": 184,
"prices": 765,
"remained": 857,
"lowest": 588,
"50": 14,
"protectionism": 793,
"constrain": 225,
"increase": 490,
"exports": 370,
"decisions": 267,
"affect": 36,
"continue": 229,
"forums": 404,
"exclude": 363,
"carrying": 144,
"structural": 978,
"adjustments": 30,
"economies": 326,
"interact": 520,
"mainstream": 591,
"performed": 720,
"context": 228,
"open": 676,
"operative": 679,
"challenge": 155,
"higher": 463,
"shared": 930,
"groups": 442,
"debt": 265,
"shackling": 928,
"heavily": 457,
"indebted": 493,
"regard": 838,
"various": 1081,
"plans": 727,
"mooted": 627,
"cases": 145,
"notably": 663,
"mexico": 617,
"elaborate": 331,
"packages": 698,
"involving": 532,
"cancellation": 139,
"debts": 266,
"negotiated": 651,
"make": 595,
"dent": 275,
"indebtedness": 494,
"putting": 804,
"conditionalities": 204,
"attached": 90,
"threatens": 1016,
"engulf": 347,
"despite": 281,
"severe": 927,
"difficulties": 296,
"managed": 598,
"balance": 99,
"payments": 712,
"accounts": 20,
"ratio": 817,
"increased": 491,
"rapidly": 816,
"coincided": 175,
"decline": 268,
"concessional": 199,
"pushed": 803,
"borrowings": 123,
"turn": 1044,
"aggravated": 42,
"servicing": 923,
"burden": 130,
"include": 488,
"anticipatory": 58,
"prevent": 763,
"category": 146,
"falling": 379,
"trap": 1033,
"flow": 390,
"finance": 388
}
}
}