From 88fb81a779f905eff3a87b9ad6d0e32b60c488af Mon Sep 17 00:00:00 2001 From: minmin-intel Date: Mon, 2 Dec 2024 15:37:37 -0800 Subject: [PATCH] update llm judge model --- .../agent_eval/crag_eval/docker/launch_eval_container.sh | 2 +- .../run_benchmark/llm_judge/docker-compose-llm-judge-gaudi.yaml | 2 +- .../run_benchmark/llm_judge/launch_llm_judge_endpoint.sh | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/evals/evaluation/agent_eval/crag_eval/docker/launch_eval_container.sh b/evals/evaluation/agent_eval/crag_eval/docker/launch_eval_container.sh index 681e79e9..cf25502f 100644 --- a/evals/evaluation/agent_eval/crag_eval/docker/launch_eval_container.sh +++ b/evals/evaluation/agent_eval/crag_eval/docker/launch_eval_container.sh @@ -4,4 +4,4 @@ volume=$WORKDIR host_ip=$(hostname -I | awk '{print $1}') -docker run -it --name rag_eval -v $volume:/home/user/ -e WORKDIR=/home/user -e HF_HOME=/home/user/hf_cache -e host_ip=$host_ip -e http_proxy=$http_proxy -e https_proxy=$https_proxy crag-eval:v1.1 +docker run -it --name crag_eval -v $volume:/home/user/ -e WORKDIR=/home/user -e HF_HOME=/home/user/hf_cache -e host_ip=$host_ip -e http_proxy=$http_proxy -e https_proxy=$https_proxy crag-eval:v1.1 diff --git a/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/docker-compose-llm-judge-gaudi.yaml b/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/docker-compose-llm-judge-gaudi.yaml index 572011ef..1ba0962a 100644 --- a/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/docker-compose-llm-judge-gaudi.yaml +++ b/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/docker-compose-llm-judge-gaudi.yaml @@ -3,7 +3,7 @@ services: tgi-service: - image: ghcr.io/huggingface/tgi-gaudi:latest + image: ghcr.io/huggingface/tgi-gaudi:2.0.5 container_name: tgi-server ports: - "8085:80" diff --git a/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/launch_llm_judge_endpoint.sh b/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/launch_llm_judge_endpoint.sh index 0cb08d8f..1a57cd56 100644 --- a/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/launch_llm_judge_endpoint.sh +++ b/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/launch_llm_judge_endpoint.sh @@ -1,7 +1,7 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 -export LLM_MODEL_ID="meta-llama/Meta-Llama-3-70B-Instruct" +export LLM_MODEL_ID="meta-llama/Meta-Llama-3.1-70B-Instruct" export HUGGINGFACEHUB_API_TOKEN=${HUGGINGFACEHUB_API_TOKEN} export HF_CACHE_DIR=${HF_CACHE_DIR} docker compose -f docker-compose-llm-judge-gaudi.yaml up -d