mnauf committed on
Commit ·
0a57ca5
1
Parent(s): b98d5cd
first commit
Browse files
app.py
CHANGED
|
@@ -49,5 +49,5 @@ with gr.Blocks() as block:
|
|
| 49 |
outputs=outputs,
|
| 50 |
queue=True
|
| 51 |
)
|
| 52 |
-
block.queue(concurrency_count=5).launch(server_name="localhost", share=True)
|
| 53 |
-
|
|
|
|
| 49 |
outputs=outputs,
|
| 50 |
queue=True
|
| 51 |
)
|
| 52 |
+
# block.queue(concurrency_count=5).launch(server_name="localhost", share=True)
|
| 53 |
+
block.queue().launch()
|
sample.py
CHANGED
|
@@ -17,9 +17,9 @@ max_new_tokens = 500 # number of tokens generated in each sample
|
|
| 17 |
temperature = 0.8 # 1.0 = no change, < 1.0 = less random, > 1.0 = more random, in predictions
|
| 18 |
top_k = 200 # retain only the top_k most likely tokens, clamp others to have 0 probability
|
| 19 |
seed = 1337
|
| 20 |
-
device = '
|
| 21 |
dtype = 'bfloat16' # 'float32' or 'bfloat16' or 'float16'
|
| 22 |
-
compile =
|
| 23 |
exec(open('configurator.py').read()) # overrides from command line or config file
|
| 24 |
# -----------------------------------------------------------------------------
|
| 25 |
|
|
|
|
| 17 |
temperature = 0.8 # 1.0 = no change, < 1.0 = less random, > 1.0 = more random, in predictions
|
| 18 |
top_k = 200 # retain only the top_k most likely tokens, clamp others to have 0 probability
|
| 19 |
seed = 1337
|
| 20 |
+
device = 'cpu' # examples: 'cpu', 'cuda', 'cuda:0', 'cuda:1', etc.
|
| 21 |
dtype = 'bfloat16' # 'float32' or 'bfloat16' or 'float16'
|
| 22 |
+
compile = True # use PyTorch 2.0 to compile the model to be faster
|
| 23 |
exec(open('configurator.py').read()) # overrides from command line or config file
|
| 24 |
# -----------------------------------------------------------------------------
|
| 25 |
|