File size: 122 Bytes
d57e49b
 
 
 
1
2
3
4
5
# Start the uvicorn app `src.main:app` with auto-reload on port 3535, using the
# virtualenv binary at server/.venv/bin/uvicorn.
#
# Must be invoked from the directory that contains `server/` (the path is
# relative to the caller's current working directory).
#
# Environment set for the server process only:
#   DEVICE=cuda:0
#   ATTN_IMPLEMENTATION=flash_attention_2
#
# Everything runs inside a subshell so that:
#   * the caller's working directory is never modified, whether this file is
#     executed or sourced, and regardless of how the server exits;
#   * a failed `cd` aborts before uvicorn is launched from the wrong directory;
#   * the exit status of this block is the server's (or 1 if `cd` failed).
(
  cd server || {
    printf 'error: cannot cd into "server" from %s\n' "$PWD" >&2
    exit 1
  }

  DEVICE=cuda:0 ATTN_IMPLEMENTATION=flash_attention_2 \
    ./.venv/bin/uvicorn src.main:app --reload --port 3535
)