Spaces: Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -18,7 +18,7 @@ device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
18   model_id = "google/gemma-2-9b-it"
19   tokenizer = GemmaTokenizerFast.from_pretrained(model_id, token = huggingface_token)
20
21 - quantization = BitsAndBytesConfig(
22   model = AutoModelForCausalLM.from_pretrained(
23   model_id,
24   device_map="auto",

18   model_id = "google/gemma-2-9b-it"
19   tokenizer = GemmaTokenizerFast.from_pretrained(model_id, token = huggingface_token)
20
21 + quantization = BitsAndBytesConfig(load_in_4bit= True)
22   model = AutoModelForCausalLM.from_pretrained(
23   model_id,
24   device_map="auto",