Spaces:
Running on T4
Running on T4
Update app.py
Browse files
app.py
CHANGED
|
@@ -20,6 +20,7 @@ device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
|
| 20 |
|
| 21 |
ctx_limit = 2500
|
| 22 |
gen_limit = 500
|
|
|
|
| 23 |
ENABLE_VISUAL = False
|
| 24 |
|
| 25 |
########################## text rwkv ################################################################
|
|
@@ -32,8 +33,8 @@ model_v6 = RWKV(model=model_path_v6, strategy='cuda fp16')
|
|
| 32 |
pipeline_v6 = PIPELINE(model_v6, "rwkv_vocab_v20230424")
|
| 33 |
|
| 34 |
args = model_v6.args
|
| 35 |
-
eng_name = 'rwkv-x060-eng_single_round_qa-3B-
|
| 36 |
-
chn_name = 'rwkv-x060-chn_single_round_qa-3B-
|
| 37 |
|
| 38 |
# state_eng_raw = torch.load(f'/mnt/e/RWKV-Runner/models/{eng_name}.pth', map_location=torch.device('cpu'))
|
| 39 |
# state_chn_raw = torch.load(f'/mnt/e/RWKV-Runner/models/{chn_name}.pth', map_location=torch.device('cpu'))
|
|
@@ -267,22 +268,22 @@ examples = [
|
|
| 267 |
]
|
| 268 |
|
| 269 |
examples_eng = [
|
| 270 |
-
["How can I craft an engaging story featuring vampires on Mars?",
|
| 271 |
-
["Compare the business models of Apple and Google.",
|
| 272 |
-
["In JSON format, list the top 5 tourist attractions in Paris.",
|
| 273 |
-
["Write an outline for a fantasy novel where dreams can alter reality.",
|
| 274 |
-
["Can fish get thirsty?",
|
| 275 |
-
["Write a Bash script to check disk usage and send alerts if it's too high.",
|
| 276 |
-
["Write a simple website in HTML. When a user clicks the button, it shows a random joke from a list of 4 jokes.",
|
| 277 |
]
|
| 278 |
|
| 279 |
examples_chn = [
|
| 280 |
-
["怎样写一个在火星上的吸血鬼的有趣故事?",
|
| 281 |
-
["比较苹果和谷歌的商业模式。",
|
| 282 |
-
["鱼会口渴吗?",
|
| 283 |
-
["以 JSON 格式列举北京的美食。",
|
| 284 |
-
["编写一个Bash脚本来检查磁盘使用情况,如果使用量过高则发送警报。",
|
| 285 |
-
["用HTML编写一个简单的网站。当用户点击按钮时,从4个笑话的列表中随机显示一个笑话。",
|
| 286 |
]
|
| 287 |
|
| 288 |
if ENABLE_VISUAL:
|
|
@@ -450,7 +451,7 @@ with gr.Blocks(title=title_v6) as demo:
|
|
| 450 |
with gr.Row():
|
| 451 |
with gr.Column():
|
| 452 |
prompt = gr.Textbox(lines=2, label="Prompt", value="How can I craft an engaging story featuring vampires on Mars?")
|
| 453 |
-
token_count = gr.Slider(10,
|
| 454 |
temperature = gr.Slider(0.2, 2.0, label="Temperature", step=0.1, value=1.0)
|
| 455 |
top_p = gr.Slider(0.0, 1.0, label="Top P", step=0.05, value=0.2)
|
| 456 |
presence_penalty = gr.Slider(0.0, 1.0, label="Presence Penalty", step=0.1, value=0.3)
|
|
@@ -470,7 +471,7 @@ with gr.Blocks(title=title_v6) as demo:
|
|
| 470 |
with gr.Row():
|
| 471 |
with gr.Column():
|
| 472 |
prompt = gr.Textbox(lines=2, label="Prompt", value="怎样写一个在火星上的吸血鬼的有趣故事?")
|
| 473 |
-
token_count = gr.Slider(10,
|
| 474 |
temperature = gr.Slider(0.2, 2.0, label="Temperature", step=0.1, value=1.0)
|
| 475 |
top_p = gr.Slider(0.0, 1.0, label="Top P", step=0.05, value=0.2)
|
| 476 |
presence_penalty = gr.Slider(0.0, 1.0, label="Presence Penalty", step=0.1, value=0.3)
|
|
|
|
| 20 |
|
| 21 |
ctx_limit = 2500
|
| 22 |
gen_limit = 500
|
| 23 |
+
gen_limit_long = 800
|
| 24 |
ENABLE_VISUAL = False
|
| 25 |
|
| 26 |
########################## text rwkv ################################################################
|
|
|
|
| 33 |
pipeline_v6 = PIPELINE(model_v6, "rwkv_vocab_v20230424")
|
| 34 |
|
| 35 |
args = model_v6.args
|
| 36 |
+
eng_name = 'rwkv-x060-eng_single_round_qa-3B-20240516-ctx2048'
|
| 37 |
+
chn_name = 'rwkv-x060-chn_single_round_qa-3B-20240516-ctx2048'
|
| 38 |
|
| 39 |
# state_eng_raw = torch.load(f'/mnt/e/RWKV-Runner/models/{eng_name}.pth', map_location=torch.device('cpu'))
|
| 40 |
# state_chn_raw = torch.load(f'/mnt/e/RWKV-Runner/models/{chn_name}.pth', map_location=torch.device('cpu'))
|
|
|
|
| 268 |
]
|
| 269 |
|
| 270 |
examples_eng = [
|
| 271 |
+
["How can I craft an engaging story featuring vampires on Mars?", gen_limit_long, 1, 0.2, 0.3, 0.3],
|
| 272 |
+
["Compare the business models of Apple and Google.", gen_limit_long, 1, 0.2, 0.3, 0.3],
|
| 273 |
+
["In JSON format, list the top 5 tourist attractions in Paris.", gen_limit_long, 1, 0.2, 0.3, 0.3],
|
| 274 |
+
["Write an outline for a fantasy novel where dreams can alter reality.", gen_limit_long, 1, 0.2, 0.3, 0.3],
|
| 275 |
+
["Can fish get thirsty?", gen_limit_long, 1, 0.2, 0.3, 0.3],
|
| 276 |
+
["Write a Bash script to check disk usage and send alerts if it's too high.", gen_limit_long, 1, 0.2, 0.3, 0.3],
|
| 277 |
+
["Write a simple website in HTML. When a user clicks the button, it shows a random joke from a list of 4 jokes.", gen_limit_long, 1, 0.2, 0.3, 0.3],
|
| 278 |
]
|
| 279 |
|
| 280 |
examples_chn = [
|
| 281 |
+
["怎样写一个在火星上的吸血鬼的有趣故事?", gen_limit_long, 1, 0.2, 0.3, 0.3],
|
| 282 |
+
["比较苹果和谷歌的商业模式。", gen_limit_long, 1, 0.2, 0.3, 0.3],
|
| 283 |
+
["鱼会口渴吗?", gen_limit_long, 1, 0.2, 0.3, 0.3],
|
| 284 |
+
["以 JSON 格式列举北京的美食。", gen_limit_long, 1, 0.2, 0.3, 0.3],
|
| 285 |
+
["编写一个Bash脚本来检查磁盘使用情况,如果使用量过高则发送警报。", gen_limit_long, 1, 0.2, 0.3, 0.3],
|
| 286 |
+
["用HTML编写一个简单的网站。当用户点击按钮时,从4个笑话的列表中随机显示一个笑话。", gen_limit_long, 1, 0.2, 0.3, 0.3],
|
| 287 |
]
|
| 288 |
|
| 289 |
if ENABLE_VISUAL:
|
|
|
|
| 451 |
with gr.Row():
|
| 452 |
with gr.Column():
|
| 453 |
prompt = gr.Textbox(lines=2, label="Prompt", value="How can I craft an engaging story featuring vampires on Mars?")
|
| 454 |
+
token_count = gr.Slider(10, gen_limit_long, label="Max Tokens", step=10, value=gen_limit_long)
|
| 455 |
temperature = gr.Slider(0.2, 2.0, label="Temperature", step=0.1, value=1.0)
|
| 456 |
top_p = gr.Slider(0.0, 1.0, label="Top P", step=0.05, value=0.2)
|
| 457 |
presence_penalty = gr.Slider(0.0, 1.0, label="Presence Penalty", step=0.1, value=0.3)
|
|
|
|
| 471 |
with gr.Row():
|
| 472 |
with gr.Column():
|
| 473 |
prompt = gr.Textbox(lines=2, label="Prompt", value="怎样写一个在火星上的吸血鬼的有趣故事?")
|
| 474 |
+
token_count = gr.Slider(10, gen_limit_long, label="Max Tokens", step=10, value=gen_limit_long)
|
| 475 |
temperature = gr.Slider(0.2, 2.0, label="Temperature", step=0.1, value=1.0)
|
| 476 |
top_p = gr.Slider(0.0, 1.0, label="Top P", step=0.05, value=0.2)
|
| 477 |
presence_penalty = gr.Slider(0.0, 1.0, label="Presence Penalty", step=0.1, value=0.3)
|