feat: add nexa-sdk

This commit is contained in:
Sun-ZhenXing
2025-11-16 00:12:14 +08:00
parent 5f9820e7db
commit 1c42cb2800
9 changed files with 616 additions and 5 deletions

View File

@@ -0,0 +1,41 @@
# Global registry for container images (optional)
# GLOBAL_REGISTRY=
# Nexa SDK version
NEXA_SDK_VERSION=latest
# Timezone configuration
TZ=UTC
# Port override for host binding
NEXA_SDK_PORT_OVERRIDE=8080
# Server configuration
NEXA_HOST=0.0.0.0:8080
NEXA_KEEPALIVE=300
NEXA_ORIGINS=*
# HuggingFace token for accessing private models (optional)
NEXA_HFTOKEN=
# Logging level (none, debug, info, warn, error)
NEXA_LOG=none
# Model to run (can be any Nexa-compatible model)
# Examples: gemma-2-2b-instruct, qwen3-4b, llama-3-8b, mistral-7b
NEXA_MODEL=gemma-2-2b-instruct
# GPU configuration (for gpu profile only)
# Number of GPU layers to offload (-1 for all layers)
NEXA_GPU_LAYERS=-1
# Shared memory size
NEXA_SHM_SIZE=2g
# Resource limits
NEXA_SDK_CPU_LIMIT=4.0
NEXA_SDK_MEMORY_LIMIT=8G
# Resource reservations
NEXA_SDK_CPU_RESERVATION=2.0
NEXA_SDK_MEMORY_RESERVATION=4G