ollama      1107  0.0  0.0 2977364 61024 ?       Ssl  Jul04   0:12 /usr/local/bin/ollama serve
root        3531  0.1  0.6 8246444 871340 pts/1  Sl+  Jul04   5:28 python3 -m vllm.entrypoints.openai.api_server --gpu-memory-utilization 0.95 --model=meta-llama/Llama-3.2-11B-Vision-Instruct --tokenizer=meta-llama/Llama-3.2-11B-Vision-Instruct --download-dir=/var/www/.cache/huggingface/hub --dtype=bfloat16 --device=auto --host=77.68.79.111 --port=5000 --max-model-len=8192 --quantization=fp8 --enforce_eager --max_num_seqs=8 --enable_chunked-prefill=false
www-data  887600  0.0  0.0   2576   900 ?        S    02:42   0:00 sh -c ps aux | grep llama
www-data  887602  0.0  0.0   3324  1472 ?        S    02:42   0:00 grep llama