thepolymerguy committed on
Commit
e450f6c
·
1 Parent(s): 2b64787

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -17,7 +17,7 @@ model = LlamaForCausalLM.from_pretrained(
17
  load_in_8bit=True,
18
  device_map="auto") #low_cpu_mem_usage=True)
19
 
20
- #model = model.to('cuda')
21
 
22
 
23
  def add_text(history, text):
@@ -68,7 +68,7 @@ def generateresponse(history, task):
68
  PROMPT,
69
  return_tensors="pt",
70
  )
71
- input_ids = inputs["input_ids"]#.cuda()
72
 
73
  generation_config = GenerationConfig(
74
  temperature=0.6,
 
17
  load_in_8bit=True,
18
  device_map="auto") #low_cpu_mem_usage=True)
19
 
20
+ model = model.to('cuda')
21
 
22
 
23
  def add_text(history, text):
 
68
  PROMPT,
69
  return_tensors="pt",
70
  )
71
+ input_ids = inputs["input_ids"].cuda()
72
 
73
  generation_config = GenerationConfig(
74
  temperature=0.6,