File tree Expand file tree Collapse file tree 2 files changed +3
-3
lines changed
VisualQnA/docker_compose/amd/gpu/rocm Expand file tree Collapse file tree 2 files changed +3
-3
lines changed Original file line number Diff line number Diff line change @@ -30,7 +30,7 @@ services:
30
30
security_opt :
31
31
- seccomp:unconfined
32
32
- apparmor=unconfined
33
- command: "--model ${VISUALQNA_LLM_MODEL_ID} --swap-space 16 --disable-log-requests --dtype float16 --tensor-parallel-size 1 --host 0.0.0.0 --port 8011 --num-scheduler-steps 1 --distributed-executor-backend \"mp\""
33
+ command: "--model ${VISUALQNA_LVM_MODEL_ID} --swap-space 16 --disable-log-requests --dtype float16 --tensor-parallel-size 1 --host 0.0.0.0 --port 8011 --num-scheduler-steps 1 --distributed-executor-backend \"mp\""
34
34
ipc : host
35
35
lvm :
36
36
image : ${REGISTRY:-opea}/lvm:${TAG:-latest}
@@ -46,7 +46,7 @@ services:
46
46
https_proxy : ${https_proxy}
47
47
LVM_COMPONENT_NAME: "OPEA_VLLM_LVM"
48
48
LVM_ENDPOINT : ${LVM_ENDPOINT}
49
- LLM_MODEL_ID: ${VISUALQNA_LLM_MODEL_ID}
49
+ LLM_MODEL_ID: ${VISUALQNA_LVM_MODEL_ID}
50
50
HF_HUB_DISABLE_PROGRESS_BARS : 1
51
51
HF_HUB_ENABLE_HF_TRANSFER : 0
52
52
restart : unless-stopped
Original file line number Diff line number Diff line change @@ -9,7 +9,7 @@ export VISUALQNA_VLLM_SERVICE_PORT="8081"
9
9
export VISUALQNA_HUGGINGFACEHUB_API_TOKEN=${Your_HUGGINGFACEHUB_API_TOKEN}
10
10
export VISUALQNA_CARD_ID="card1"
11
11
export VISUALQNA_RENDER_ID="renderD136"
12
- export VISUALQNA_LLM_MODEL_ID="Xkev/Llama-3.2V-11B-cot"
12
+ export VISUALQNA_LVM_MODEL_ID="Xkev/Llama-3.2V-11B-cot"
13
13
export LVM_ENDPOINT="http://${HOST_IP}:${VISUALQNA_VLLM_SERVICE_PORT}"
14
14
export LVM_SERVICE_PORT=9399
15
15
export MEGA_SERVICE_HOST_IP=${HOST_IP}
You can’t perform that action at this time.
0 commit comments