# Environment template: every value below is either a placeholder or a default.
# Copy this file, fill in the placeholders, and keep the filled-in copy out of
# version control, since it will contain secrets.

# Placeholder -- replace with your own token.
# NOTE(review): presumably a Hugging Face access token used to download the
# model; confirm against the service that reads it.
HF_TOKEN=YOUR_HF_TOKEN_HERE

# Placeholder -- replace with an API key of your choosing.
# NOTE(review): presumably the key clients must present to the local vLLM
# server; confirm against the server configuration.
VLLM_API_KEY=YOUR_LOCAL_API_KEY_HERE

# Identifier of the model to serve.
# NOTE(review): looks like a Hugging Face Hub repository id -- confirm.
GEMMA_MODEL_ID=google/gemma-3-1b-it

# Port number for the backend.
# NOTE(review): whether this is the host or the container port is not visible
# from this file.
BACKEND_PORT=8000

# Directory used as the Hugging Face cache.
# NOTE(review): the path hard-codes /home/${USER}; this only resolves correctly
# if the consumer expands ${USER} and the home directory lives under /home
# (not the case for root or on macOS). Adjust for your machine if needed.
HUGGINGFACE_CACHE_DIR=/home/${USER}/.cache/huggingface

# NOTE(review): presumably forwarded to vLLM as the maximum model context
# length in tokens -- confirm against the launch command.
VLLM_MAX_MODEL_LEN=4096

# NOTE(review): presumably forwarded to vLLM as the fraction (0-1) of GPU
# memory it may use -- confirm against the launch command.
VLLM_GPU_MEMORY_UTILIZATION=0.88