-
Notifications
You must be signed in to change notification settings - Fork 243
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge branch 'awslabs:main' into spark-cleanup-fix
- Loading branch information
Showing
18 changed files
with
863 additions
and
43 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,17 @@ | ||
# Base image: Ray 2.41.0 (the tag indicates Python 3.10 / CUDA 11.8), pinned by tag.
FROM rayproject/ray:2.41.0-py310-cu118 AS base

# Maintainer label
LABEL maintainer="DoEKS"

# Suppress interactive debconf prompts. The frontend name is spelled
# "noninteractive" (no hyphen); "non-interactive" is not a debconf frontend,
# so the previous value did not actually disable prompting.
ENV DEBIAN_FRONTEND=noninteractive

# Put the directory that holds libpython3.10.so.1.0 first on the loader path.
# ${VAR:+...} appends the inherited value only when it is set, so an unset
# LD_LIBRARY_PATH does not leave a trailing ":" (which the dynamic loader
# interprets as the current working directory).
ENV LD_LIBRARY_PATH=/home/ray/anaconda3/lib${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}

# Set the working directory
WORKDIR /app

# Install vLLM and the Hugging Face Hub client in a single layer, both pinned
# to exact versions. --no-cache-dir keeps pip's download cache out of the image.
RUN pip install --no-cache-dir vllm==0.7.0 huggingface_hub==0.27.1
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,65 @@ | ||
---
# Namespace that the open-webui resources below are created in.
apiVersion: v1
kind: Namespace
metadata:
  name: open-webui
|
||
---
# Single-replica Deployment of the Open WebUI container, configured to talk to
# an OpenAI-compatible endpoint via the environment variables below.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: open-webui
  namespace: open-webui
  labels:
    app: open-webui
spec:
  replicas: 1
  selector:
    matchLabels:
      app: open-webui
  template:
    metadata:
      labels:
        app: open-webui
    spec:
      containers:
        - name: open-webui
          # NOTE(review): ":main" is a moving tag; consider pinning a release
          # tag or digest for reproducible rollouts.
          image: ghcr.io/open-webui/open-webui:main
          ports:
            - containerPort: 8080
          resources:
            requests:
              cpu: "500m"
              memory: "500Mi"
            limits:
              cpu: "1000m"
              memory: "1Gi"
          env:
            # URL of the vLLM Kubernetes Service that the Open WebUI client connects to.
            - name: OPENAI_API_BASE_URLS
              value: "http://vllm-serve-svc.rayserve-vllm.svc.cluster.local:8000/v1"
            - name: OPENAI_API_KEY
              value: "dummy" # Replace with actual API key if required
          volumeMounts:
            - name: webui-volume
              mountPath: /app/backend/data
      volumes:
        # emptyDir is scoped to the pod's lifetime: data under
        # /app/backend/data is lost when the pod is removed.
        - name: webui-volume
          emptyDir: {}
|
||
---
# ClusterIP Service that exposes the open-webui pods on port 80 and forwards
# traffic to the container's port 8080.
apiVersion: v1
kind: Service
metadata:
  name: open-webui
  namespace: open-webui
  labels:
    app: open-webui
spec:
  type: ClusterIP
  selector:
    app: open-webui
  ports:
    - protocol: TCP
      port: 80
      targetPort: 8080
Oops, something went wrong.