TheBloke committed on
Commit 92ae604
1 Parent(s): 80444cb

Update README.md

Files changed (1): README.md +4 -4
README.md CHANGED
@@ -134,15 +134,15 @@ tokenizer = AutoTokenizer.from_pretrained(model_name_or_path, use_fast=True)
 
 model = AutoGPTQForCausalLM.from_quantized(model_name_or_path,
         model_basename=model_basename,
+        max_memory={0: '60GiB', 1: '79GiB'} # max_memory is for 2 x 80GB GPUs; adjust if your config is different!
         use_safetensors=True,
         trust_remote_code=False,
-        device="cuda:0",
         use_triton=use_triton,
         quantize_config=None)
 
-prompt = "Translate this to French: AI is the future of computing"
-prompt_template=f'''{prompt}
-Translation:
+prompt = "Write a story about llamas"
+prompt_template=f'''<human>: {prompt}
+<bot>:
 '''
 
 print("\n\n*** Generate:")