Spaces:

Lam-Hung
/

Japanese_assistant

Runtime error

Lam-Hung committed on Aug 13

Commit

d533c0e

•

1 Parent(s): b32edec

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -18,7 +18,7 @@ device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
 model_id = "google/gemma-2-9b-it"
 tokenizer = GemmaTokenizerFast.from_pretrained(model_id, token = huggingface_token)
-quantization = BitsAndBytesConfig(load_in_8bit= True)
 model = AutoModelForCausalLM.from_pretrained(
     model_id,
     device_map="auto",

 model_id = "google/gemma-2-9b-it"
 tokenizer = GemmaTokenizerFast.from_pretrained(model_id, token = huggingface_token)
+quantization = BitsAndBytesConfig(load_in_4bit= True)
 model = AutoModelForCausalLM.from_pretrained(
     model_id,
     device_map="auto",