mnauf committed on
Commit
0a57ca5
·
1 Parent(s): b98d5cd

first commit

Browse files
Files changed (2) hide show
  1. app.py +2 -2
  2. sample.py +2 -2
app.py CHANGED
@@ -49,5 +49,5 @@ with gr.Blocks() as block:
49
  outputs=outputs,
50
  queue=True
51
  )
52
- block.queue(concurrency_count=5).launch(server_name="localhost", share=True)
53
- # block.queue().launch()
 
49
  outputs=outputs,
50
  queue=True
51
  )
52
+ # block.queue(concurrency_count=5).launch(server_name="localhost", share=True)
53
+ block.queue().launch()
sample.py CHANGED
@@ -17,9 +17,9 @@ max_new_tokens = 500 # number of tokens generated in each sample
17
  temperature = 0.8 # 1.0 = no change, < 1.0 = less random, > 1.0 = more random, in predictions
18
  top_k = 200 # retain only the top_k most likely tokens, clamp others to have 0 probability
19
  seed = 1337
20
- device = 'cuda' # examples: 'cpu', 'cuda', 'cuda:0', 'cuda:1', etc.
21
  dtype = 'bfloat16' # 'float32' or 'bfloat16' or 'float16'
22
- compile = False # use PyTorch 2.0 to compile the model to be faster
23
  exec(open('configurator.py').read()) # overrides from command line or config file
24
  # -----------------------------------------------------------------------------
25
 
 
17
  temperature = 0.8 # 1.0 = no change, < 1.0 = less random, > 1.0 = more random, in predictions
18
  top_k = 200 # retain only the top_k most likely tokens, clamp others to have 0 probability
19
  seed = 1337
20
+ device = 'cpu' # examples: 'cpu', 'cuda', 'cuda:0', 'cuda:1', etc.
21
  dtype = 'bfloat16' # 'float32' or 'bfloat16' or 'float16'
22
+ compile = True # use PyTorch 2.0 to compile the model to be faster
23
  exec(open('configurator.py').read()) # overrides from command line or config file
24
  # -----------------------------------------------------------------------------
25