Spaces:
Runtime error
Runtime error
elma-dev
committed on
Commit
·
d616881
1
Parent(s):
7977478
change to bf16
Browse files
app.py
CHANGED
|
@@ -18,7 +18,7 @@ model = AutoModelForCausalLM.from_pretrained(config.base_model_name_or_path,
|
|
| 18 |
token = os.environ['TOKEN'],
|
| 19 |
torch_dtype=torch.bfloat16
|
| 20 |
)
|
| 21 |
-
model = PeftModel.from_pretrained(model,MODEL_NAME)
|
| 22 |
tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
|
| 23 |
if tokenizer.pad_token is None:
|
| 24 |
tokenizer.pad_token = tokenizer.eos_token
|
|
@@ -55,9 +55,9 @@ model_response = gr.Textbox(
|
|
| 55 |
rtl=True,
|
| 56 |
)
|
| 57 |
|
| 58 |
-
temperature = gr.Slider(minimum=0.
|
| 59 |
-
top_k = gr.Slider(1, 10000, value=
|
| 60 |
-
repetition_penalty = gr.Slider(0.
|
| 61 |
|
| 62 |
demo=gr.Interface(
|
| 63 |
fn=generate,
|
|
|
|
| 18 |
token = os.environ['TOKEN'],
|
| 19 |
torch_dtype=torch.bfloat16
|
| 20 |
)
|
| 21 |
+
model = PeftModel.from_pretrained(model,MODEL_NAME,torch_dtype=torch.bfloat16)
|
| 22 |
tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
|
| 23 |
if tokenizer.pad_token is None:
|
| 24 |
tokenizer.pad_token = tokenizer.eos_token
|
|
|
|
| 55 |
rtl=True,
|
| 56 |
)
|
| 57 |
|
| 58 |
+
temperature = gr.Slider(minimum=0.01,maximum=1.0,value=0.7, label="Temperature") # Reduced default
|
| 59 |
+
top_k = gr.Slider(1, 10000, value=10, label="Top-k") # Reduced default
|
| 60 |
+
repetition_penalty = gr.Slider(0.1, 100.0, value=1.2, label="Repetition Penalty") # Reduced default
|
| 61 |
|
| 62 |
demo=gr.Interface(
|
| 63 |
fn=generate,
|