Lam-Hung committed on
Commit
d533c0e
1 Parent(s): b32edec

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -18,7 +18,7 @@ device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
18
  model_id = "google/gemma-2-9b-it"
19
  tokenizer = GemmaTokenizerFast.from_pretrained(model_id, token = huggingface_token)
20
 
21
- quantization = BitsAndBytesConfig(load_in_8bit= True)
22
  model = AutoModelForCausalLM.from_pretrained(
23
  model_id,
24
  device_map="auto",
 
18
  model_id = "google/gemma-2-9b-it"
19
  tokenizer = GemmaTokenizerFast.from_pretrained(model_id, token = huggingface_token)
20
 
21
+ quantization = BitsAndBytesConfig(load_in_4bit= True)
22
  model = AutoModelForCausalLM.from_pretrained(
23
  model_id,
24
  device_map="auto",