#!/usr/bin/env bash
# Create a conda environment named "lmdeploy" (Python 3.11), install LMDeploy
# plus the extra packages partial_json_parser and timm, then start the LMDeploy
# API server for OpenGVLab/InternVL3-8B-Instruct on port 23333 using the
# turbomind backend.
#
# Every step is chained with `&&` so that a failure (for example, the
# environment could not be created or activated) stops the sequence instead of
# installing packages into whatever environment happens to be active.
#
# `conda activate` is a shell function that only exists once conda's shell
# integration has been loaded; non-interactive shells usually have not loaded
# it, so it is sourced explicitly from the conda installation first. The base
# path is looked up in its own step so that a failed lookup cannot turn into
# sourcing an unrelated "/etc/profile.d/conda.sh".
conda_base=$(conda info --base) \
  && . "${conda_base}/etc/profile.d/conda.sh" \
  && conda create --name lmdeploy python=3.11 --yes \
  && conda activate lmdeploy \
  && pip install lmdeploy partial_json_parser timm \
  && lmdeploy serve api_server OpenGVLab/InternVL3-8B-Instruct \
    --backend turbomind \
    --server-port 23333 \
    --tp 1 \
    --chat-template internvl2_5