From 88fb81a779f905eff3a87b9ad6d0e32b60c488af Mon Sep 17 00:00:00 2001
From: minmin-intel <minmin.hou@intel.com>
Date: Mon, 2 Dec 2024 15:37:37 -0800
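Subject: [PATCH] update llm judge model

Switch the LLM judge model from meta-llama/Meta-Llama-3-70B-Instruct to
meta-llama/Meta-Llama-3.1-70B-Instruct, pin the tgi-gaudi image to 2.0.5
instead of latest, and rename the eval container from rag_eval to
crag_eval.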
---
 .../agent_eval/crag_eval/docker/launch_eval_container.sh        | 2 +-
 .../run_benchmark/llm_judge/docker-compose-llm-judge-gaudi.yaml | 2 +-
 .../run_benchmark/llm_judge/launch_llm_judge_endpoint.sh        | 2 +-
 3 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/evals/evaluation/agent_eval/crag_eval/docker/launch_eval_container.sh b/evals/evaluation/agent_eval/crag_eval/docker/launch_eval_container.sh
index 681e79e9..cf25502f 100644
--- a/evals/evaluation/agent_eval/crag_eval/docker/launch_eval_container.sh
+++ b/evals/evaluation/agent_eval/crag_eval/docker/launch_eval_container.sh
@@ -4,4 +4,4 @@
 volume=$WORKDIR
 host_ip=$(hostname -I | awk '{print $1}')
 
-docker run -it --name rag_eval -v $volume:/home/user/ -e WORKDIR=/home/user -e HF_HOME=/home/user/hf_cache -e host_ip=$host_ip -e http_proxy=$http_proxy -e https_proxy=$https_proxy crag-eval:v1.1
+docker run -it --name crag_eval -v "$volume":/home/user/ -e WORKDIR=/home/user -e HF_HOME=/home/user/hf_cache -e host_ip="$host_ip" -e http_proxy="$http_proxy" -e https_proxy="$https_proxy" crag-eval:v1.1
diff --git a/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/docker-compose-llm-judge-gaudi.yaml b/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/docker-compose-llm-judge-gaudi.yaml
index 572011ef..1ba0962a 100644
--- a/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/docker-compose-llm-judge-gaudi.yaml
+++ b/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/docker-compose-llm-judge-gaudi.yaml
@@ -3,7 +3,7 @@
 
 services:
   tgi-service:
-    image: ghcr.io/huggingface/tgi-gaudi:latest
+    image: ghcr.io/huggingface/tgi-gaudi:2.0.5
     container_name: tgi-server
     ports:
       - "8085:80"
diff --git a/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/launch_llm_judge_endpoint.sh b/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/launch_llm_judge_endpoint.sh
index 0cb08d8f..1a57cd56 100644
--- a/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/launch_llm_judge_endpoint.sh
+++ b/evals/evaluation/agent_eval/crag_eval/run_benchmark/llm_judge/launch_llm_judge_endpoint.sh
@@ -1,7 +1,7 @@
 # Copyright (C) 2024 Intel Corporation
 # SPDX-License-Identifier: Apache-2.0
 
-export LLM_MODEL_ID="meta-llama/Meta-Llama-3-70B-Instruct"
+export LLM_MODEL_ID="meta-llama/Meta-Llama-3.1-70B-Instruct"
 export HUGGINGFACEHUB_API_TOKEN=${HUGGINGFACEHUB_API_TOKEN}
 export HF_CACHE_DIR=${HF_CACHE_DIR}
 docker compose -f docker-compose-llm-judge-gaudi.yaml up -d