Spaces:
Paused
Paused
Update app.py
Browse files
Added restriction
app.py
CHANGED
|
@@ -33,6 +33,59 @@ Your responses should only be within the financial subject, any other prompt or
|
|
| 33 |
# MAX_MAX_NEW_TOKENS = 2048
|
| 34 |
# DEFAULT_MAX_NEW_TOKENS = 512
|
| 35 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 36 |
model_id = "FOLZi/FinID_v2_8B_Chat"
|
| 37 |
quantization_config = BitsAndBytesConfig(load_in_8bit=True)
|
| 38 |
|
|
@@ -70,6 +123,15 @@ ct_end_token = "<|endoftext|>"
|
|
| 70 |
|
| 71 |
@spaces.GPU()
|
| 72 |
def generate(message, history):
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 73 |
history = [] # Disabled history.
|
| 74 |
history_transformer_format = history + [[message, ""]]
|
| 75 |
stop = StopOnTokens()
|
|
|
|
| 33 |
# MAX_MAX_NEW_TOKENS = 2048
|
| 34 |
# DEFAULT_MAX_NEW_TOKENS = 512
|
| 35 |
|
| 36 |
+
# Off-topic keywords used to reject prompts that are not about financial
# literacy. `generate` searches the incoming message for each entry as a whole
# word (regex `\b...\b`, case-insensitive) and returns a fixed refusal message
# when at least one entry matches.
# NOTE: entries are interpolated into a regular expression as-is by the
# caller, so keep them free of regex metacharacters (or escape them there).
restricted_words = [
    # Sports & physical activity
    "olahraga", "sport", "sports", "sepak bola", "football", "basket", "basketball", "voli", "futsal", "renang",
    "bersepeda", "yoga", "fitness", "workout", "gym", "lari", "jogging", "marathon", "bodybuilding",

    # Entertainment & pop culture
    "anime", "manga", "komik", "comic", "kartun", "cartoon", "drama", "romance", "horror", "thriller", "action",
    "comedy", "film", "movie", "tv series", "series", "Netflix", "Disney", "HBO", "Amazon Prime", "YouTube",
    "streaming", "idol", "band", "musik", "lagu", "konser", "album", "artis", "aktor", "aktris", "selebritis",
    "selebriti", "gosip", "viral", "trending", "meme", "influencer", "content creator", "tiktok", "vlogger",

    # Culinary & food
    "makanan", "minuman", "resep", "memasak", "masakan", "masak", "kuliner", "menu", "ayam", "sapi", "ikan",
    "rendang", "sate", "bakso", "mie", "lontong", "nasi goreng", "kue", "jajanan", "kopi", "teh", "es krim",

    # Relationships, romance, personal life
    "pacaran", "cinta", "romantis", "romansa", "dating", "love", "jodoh", "nikah", "pernikahan", "mantan",
    "crush", "friendzone", "friendship", "persahabatan", "PDA", "perasaan", "emosi",

    # Fashion, beauty & lifestyle
    "fashion", "baju", "pakaian", "kaos", "celana", "jaket", "sepatu", "tas", "gaya", "OOTD", "skincare",
    "makeup", "lipstik", "kecantikan", "beauty", "perawatan", "spa", "salon",

    # General technology & AI
    "AI", "artificial intelligence", "machine learning", "deep learning", "robot", "android", "teknologi",
    "smartphone", "gadget", "gawai", "laptop", "hardware", "software", "game", "gaming", "console", "VR", "AR",

    # General science
    "sains", "science", "astronomi", "planet", "galaksi", "bintang", "meteor", "luar angkasa", "kimia", "biologi",
    "fisika", "matematika", "matematika diskrit", "aljabar", "statistika", "geografi", "sejarah",

    # Philosophy & religion
    "filsafat", "filosofi", "agama", "teologi", "psikologi", "mitologi", "mythology", "spiritual", "meditasi",
    "karma", "reinkarnasi",

    # Law & crime
    "hukum", "UU", "undang-undang", "legal", "ilegal", "pengadilan", "hakim", "jaksa", "kriminal", "pencurian",
    "korupsi", "penipuan", "pembunuhan", "kejahatan", "detektif", "penjara", "narkoba", "obat-obatan",

    # Politics, military, conflict
    "politik", "partai", "kampanye", "pemilu", "kandidat", "presiden", "dpr", "militer", "tentara", "perang",
    "konflik", "senjata", "roket", "bom", "rudal", "pemberontak", "terorisme",

    # Nature, animals, and environment
    "binatang", "hewan", "anjing", "kucing", "pets", "flora", "fauna", "tumbuhan", "tanaman", "hutan", "alam",
    "kebun", "cuaca", "iklim", "climate", "bencana", "gempa", "banjir", "angin", "sustainability", "green energy",

    # Miscellaneous topics outside financial literacy
    "astrologi", "zodiak", "ramalan", "santet", "sihir", "mistis", "dongeng", "cerita rakyat", "fantasi", "fiksi",
    "hantu", "alien", "konspirasi", "misteri",
]
|
| 87 |
+
|
| 88 |
+
|
| 89 |
model_id = "FOLZi/FinID_v2_8B_Chat"
|
| 90 |
quantization_config = BitsAndBytesConfig(load_in_8bit=True)
|
| 91 |
|
|
|
|
| 123 |
|
| 124 |
@spaces.GPU()
|
| 125 |
def generate(message, history):
|
| 126 |
+
|
| 127 |
+
# Pendeteksian via primitif TOO BAD!
|
| 128 |
+
matched_words = [word for word in restricted_words if re.search(rf"\b{word}\b", message, re.IGNORECASE)]
|
| 129 |
+
|
| 130 |
+
# Jika ditemukan, hentikan proses dan kembalikan pesan peringatan
|
| 131 |
+
if matched_words:
|
| 132 |
+
yield "Maaf, saya hanya dapat menjawab pertanyaan yang berkaitan dengan literasi keuangan."
|
| 133 |
+
return
|
| 134 |
+
|
| 135 |
history = [] # Disabled history.
|
| 136 |
history_transformer_format = history + [[message, ""]]
|
| 137 |
stop = StopOnTokens()
|