ollama      1113  0.0  0.0 2976596 59284 ?       Ssl  Apr03   3:31 /usr/local/bin/ollama serve
root     2192665  0.1  0.6 8493248 900252 pts/1  Sl+  May15  40:14 python3 -m vllm.entrypoints.openai.api_server --gpu-memory-utilization 0.95 --model=meta-llama/Llama-3.2-11B-Vision-Instruct --tokenizer=meta-llama/Llama-3.2-11B-Vision-Instruct --download-dir=/var/www/.cache/huggingface/hub --dtype=bfloat16 --device=auto --host=77.68.79.111 --port=5000 --max-model-len=8192 --quantization=fp8 --enforce_eager --max_num_seqs=8 --enable_chunked-prefill=false
www-data 3904085  0.0  0.0   2576   936 ?        S    00:33   0:00 sh -c ps aux | grep llama
www-data 3904087  0.0  0.0   3324  1420 ?        S    00:33   0:00 grep llama