rkumar70900 committed on
Commit
a504f50
·
verified ·
1 Parent(s): 506e559

updating readme with cuda device

Browse files
Files changed (1) hide show
  1. README.md +2 -2
README.md CHANGED
@@ -50,12 +50,12 @@ import torch
50
  from transformers import AutoModelForCausalLM, AutoTokenizer
51
 
52
  model_id = "rkumar70900/Llama-3.2-3B-Instruct-GPTQ-INT4"
53
- tokenizer = AutoTokenizer.from_pretrained(model_id)
54
  model = AutoModelForCausalLM.from_pretrained(
55
  model_id,
56
  torch_dtype=torch.float16,
57
  low_cpu_mem_usage=True,
58
- device_map="auto",
59
  )
60
 
61
  prompt = [
 
50
  from transformers import AutoModelForCausalLM, AutoTokenizer
51
 
52
  model_id = "rkumar70900/Llama-3.2-3B-Instruct-GPTQ-INT4"
53
+ tokenizer = AutoTokenizer.from_pretrained(model_id, device_map="cuda")
54
  model = AutoModelForCausalLM.from_pretrained(
55
  model_id,
56
  torch_dtype=torch.float16,
57
  low_cpu_mem_usage=True,
58
+ device_map="cuda",
59
  )
60
 
61
  prompt = [