-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathMakefile
38 lines (30 loc) · 1.38 KB
/
Makefile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
# uv: print a banner, then run setup.sh with bash to set up the UV environment.
#
# NOTE(review): GREEN and NC are not defined in the visible part of this
# Makefile. Unless they are supplied elsewhere (an included file, the
# environment, or the make command line) they expand to nothing and the
# banner is printed without colour -- confirm where they should come from.
#
# Declared phony so a file or directory named `uv` can never make this
# target look up to date.
.PHONY: uv
uv:
	@echo "$(GREEN)Setting up UV environment...$(NC)"
	@bash setup.sh
# download: fetch the NGC CLI and the two router classifier models, then copy
# the model files into routers/.
#
# Steps, in order:
#   1. Fail fast when NGC_CLI_API_KEY is unset or empty, before anything is
#      downloaded. (Previously this check ran only after the CLI archive had
#      already been fetched and unpacked.) The error goes to stderr and the
#      recipe stops with exit status 1.
#   2. Download ngccli_linux.zip (NGC CLI 3.58.0) and unpack it; `unzip -o`
#      overwrites files left by an earlier run without prompting.
#   3. Run ngc-cli/ngc (expected to come from the unpacked archive) to
#      download the task-llm-router and complexity-llm-router versions of
#      nvidia/nemo/prompt-task-and-complexity-classifier.
#   4. Create routers/ if it is missing, then copy the contents of both
#      download directories into it.
#
# NOTE(review): presumably the ngc binary reads NGC_CLI_API_KEY from the
# environment on its own -- confirm against the NGC CLI documentation.
#
# Declared phony because the recipe never creates a file named `download`.
# Status messages use @ so each is printed once instead of twice.
.PHONY: download
download:
	@if [ -z "$$NGC_CLI_API_KEY" ]; then \
		echo "NGC_CLI_API_KEY environment variable is not set. Please set this environment variable and run again." >&2; \
		exit 1; \
	else \
		echo "NGC_CLI_API_KEY environment variable is set."; \
	fi
	wget --content-disposition https://api.ngc.nvidia.com/v2/resources/nvidia/ngc-apps/ngc_cli/versions/3.58.0/files/ngccli_linux.zip -O ngccli_linux.zip && unzip -o ngccli_linux.zip
	ngc-cli/ngc registry model download-version "nvidia/nemo/prompt-task-and-complexity-classifier:task-llm-router"
	ngc-cli/ngc registry model download-version "nvidia/nemo/prompt-task-and-complexity-classifier:complexity-llm-router"
	mkdir -p routers
	cp -r prompt-task-and-complexity-classifier_vtask-llm-router/* routers/
	cp -r prompt-task-and-complexity-classifier_vcomplexity-llm-router/* routers/
	@echo "Models downloaded and stored in routers directory successfully."
# up: start the router-server and router-controller compose services.
# --build rebuilds their images before starting; -d runs them detached.
#
# Declared phony so a file or directory named `up` can never make this
# target look up to date.
.PHONY: up
up:
	docker compose up router-server router-controller --build -d
# down: stop and remove everything defined in docker-compose.yaml.
# WARNING: -v also removes the volumes declared in the compose file (and
# anonymous volumes attached to its containers), so data stored there is lost.
#
# Declared phony so a file or directory named `down` can never make this
# target look up to date.
.PHONY: down
down:
	docker compose -f docker-compose.yaml down -v
# app: build and start the `app` compose service detached, then print the
# address to visit.
#
# Declared phony: without this, any file or directory named `app` in the
# working directory makes `make app` report "up to date" and do nothing.
# The hint uses @echo so it is printed once rather than twice (command + output).
.PHONY: app
app:
	docker compose up app --build -d
	@echo "Visit the app at localhost:8008"
# metrics: build and start the `grafana` compose service detached, then print
# where the monitoring UIs are reachable.
#
# NOTE(review): the message also mentions Prometheus, but only `grafana` is
# named on the command line -- presumably Prometheus is started as a
# dependency of grafana in the compose file; confirm.
#
# Declared phony so a file or directory named `metrics` can never make this
# target look up to date. The hint uses @echo so it is printed only once.
.PHONY: metrics
metrics:
	docker compose up grafana --build -d
	@echo "Prometheus is running on 9090. Grafana is 3000 with user: admin and password: secret"
# loadtest: build and start the `locust` compose service detached.
#
# Declared phony so a file or directory named `loadtest` can never make this
# target look up to date.
.PHONY: loadtest
loadtest:
	docker compose up locust --build -d
# build-router: build and start the `router-builder` compose service detached.
#
# Declared phony so a file or directory named `build-router` can never make
# this target look up to date.
.PHONY: build-router
build-router:
	docker compose up router-builder --build -d