update model_worker.py
Browse files
- model_worker.py +3 -1
model_worker.py
CHANGED
|
@@ -232,7 +232,9 @@ class ModelWorker:
|
|
| 232 |
except ImportError:
|
| 233 |
|
| 234 |
def install_flash_attn():
|
| 235 |
-
os.system(
|
|
|
|
|
|
|
| 236 |
|
| 237 |
install_flash_attn()
|
| 238 |
# import flash_attn
|
|
|
|
| 232 |
except ImportError:
|
| 233 |
|
| 234 |
def install_flash_attn():
|
| 235 |
+
os.system(
|
| 236 |
+
"FLASH_ATTENTION_SKIP_CUDA_BUILD=TRUE pip install flash-attn==2.5.9.post1 --no-build-isolation"
|
| 237 |
+
)
|
| 238 |
|
| 239 |
install_flash_attn()
|
| 240 |
# import flash_attn
|