Spaces:
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -389,7 +389,7 @@ else:
|
|
| 389 |
# )quantization_config = nf4_config,
|
| 390 |
|
| 391 |
tokenizer = AutoTokenizer.from_pretrained("google/gemma-2b-it", token=HF_TOKEN)
|
| 392 |
-
model = AutoModelForCausalLM.from_pretrained("google/gemma-2b-it",
|
| 393 |
|
| 394 |
|
| 395 |
def make_inference(query, hist):
|
|
|
|
| 389 |
# )quantization_config = nf4_config,
|
| 390 |
|
| 391 |
tokenizer = AutoTokenizer.from_pretrained("google/gemma-2b-it", token=HF_TOKEN)
|
| 392 |
+
model = AutoModelForCausalLM.from_pretrained("google/gemma-2b-it", device_map="auto", torch_dtype=torch.bfloat16, token=HF_TOKEN)
|
| 393 |
|
| 394 |
|
| 395 |
def make_inference(query, hist):
|