elma-dev committed on
Commit
d616881
·
1 Parent(s): 7977478

change to bf16

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -18,7 +18,7 @@ model = AutoModelForCausalLM.from_pretrained(config.base_model_name_or_path,
18
  token = os.environ['TOKEN'],
19
  torch_dtype=torch.bfloat16
20
  )
21
- model = PeftModel.from_pretrained(model,MODEL_NAME)
22
  tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
23
  if tokenizer.pad_token is None:
24
  tokenizer.pad_token = tokenizer.eos_token
@@ -55,9 +55,9 @@ model_response = gr.Textbox(
55
  rtl=True,
56
  )
57
 
58
- temperature = gr.Slider(minimum=0.0,maximum=1.0,value=0.7, label="Temperature") # Reduced default
59
- top_k = gr.Slider(1, 10000, value=50, label="Top-k") # Reduced default
60
- repetition_penalty = gr.Slider(0.0, 100.0, value=1.2, label="Repetition Penalty") # Reduced default
61
 
62
  demo=gr.Interface(
63
  fn=generate,
 
18
  token = os.environ['TOKEN'],
19
  torch_dtype=torch.bfloat16
20
  )
21
+ model = PeftModel.from_pretrained(model,MODEL_NAME,torch_dtype=torch.bfloat16)
22
  tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
23
  if tokenizer.pad_token is None:
24
  tokenizer.pad_token = tokenizer.eos_token
 
55
  rtl=True,
56
  )
57
 
58
+ temperature = gr.Slider(minimum=0.01,maximum=1.0,value=0.7, label="Temperature") # Reduced default
59
+ top_k = gr.Slider(1, 10000, value=10, label="Top-k") # Reduced default
60
+ repetition_penalty = gr.Slider(0.1, 100.0, value=1.2, label="Repetition Penalty") # Reduced default
61
 
62
  demo=gr.Interface(
63
  fn=generate,