jerryzh168 committed on
Commit
1585385
·
verified ·
1 Parent(s): 065d479

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -252,7 +252,7 @@ from transformers import AutoModelForCausalLM, AutoTokenizer, TorchAoConfig
252
 
253
  # use "microsoft/Phi-4-mini-instruct" or "pytorch/Phi-4-mini-instruct-INT4"
254
  model_id = "pytorch/Phi-4-mini-instruct-INT4"
255
- quantized_model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto", torch_dtype=torch.bfloat16)
256
  tokenizer = AutoTokenizer.from_pretrained(model_id)
257
 
258
  torch.cuda.reset_peak_memory_stats()
 
252
 
253
  # use "microsoft/Phi-4-mini-instruct" or "pytorch/Phi-4-mini-instruct-INT4"
254
  model_id = "pytorch/Phi-4-mini-instruct-INT4"
255
+ quantized_model = AutoModelForCausalLM.from_pretrained(model_id, device_map="cuda:0", torch_dtype=torch.bfloat16)
256
  tokenizer = AutoTokenizer.from_pretrained(model_id)
257
 
258
  torch.cuda.reset_peak_memory_stats()