Update handler.py
Browse files- handler.py +3 -0
handler.py
CHANGED
@@ -1,6 +1,9 @@
|
|
1 |
from transformers import AutoModelForCausalLM, AutoTokenizer
|
2 |
import torch
|
3 |
|
|
|
|
|
|
|
4 |
class CustomModelHandler:
|
5 |
def __init__(self, model_name_or_path: str):
|
6 |
self.model_name_or_path = model_name_or_path
|
|
|
1 |
from transformers import AutoModelForCausalLM, AutoTokenizer
|
2 |
import torch
|
3 |
|
4 |
+
import subprocess
|
5 |
+
# Best-effort install of flash-attn at import time, before the handler class is defined.
import os
import sys

# Extend the current environment rather than replacing it: passing a bare dict
# as `env` drops PATH, HOME, virtualenv and proxy settings in the child process,
# so `pip` may not be found or may belong to a different interpreter.
# NOTE(review): FLASH_ATTENTION_SKIP_CUDA_BUILD presumably makes flash-attn's
# setup skip compiling the CUDA extension -- confirm against its setup.py.
_flash_attn_env = {**os.environ, "FLASH_ATTENTION_SKIP_CUDA_BUILD": "TRUE"}

# `sys.executable -m pip` targets the interpreter running this module, and an
# argument list avoids going through a shell. The return code is deliberately
# not checked, so a failed install does not raise here (as in the original call).
subprocess.run(
    [sys.executable, "-m", "pip", "install", "flash-attn", "--no-build-isolation"],
    env=_flash_attn_env,
)
|
6 |
+
|
7 |
class CustomModelHandler:
|
8 |
def __init__(self, model_name_or_path: str):
|
9 |
self.model_name_or_path = model_name_or_path
|