Spaces: Running on Zero
Feature(MInference): install pycuda
Browse files
app.py
CHANGED
@@ -81,12 +81,12 @@ def chat_llama3_8b(message: str,
         str: The generated response.
     """
     global model
+    subprocess.run(
+        "pip install pycuda==2023.1",
+        shell=True,
+    )
     if "has_patch" not in model.__dict__:
         from minference import MInference
-        subprocess.run(
-            "pip install pycuda==2023.1",
-            shell=True,
-        )
         minference_patch = MInference("minference", model_name)
         model = minference_patch(model)
     conversation = []