./main -m models/tinyllama-1.1b-chat-v1.0.Q5_K_M.gguf -n 500 --ignore-eos -f prompts/chat-dishes.txt
./main -m models/tinyllama-1.1b-chat-v1.0.Q5_K_M.gguf -t 3 -n 500 --ignore-eos -f prompts/chat-dishes.txt
No BLAS, 4 threads:
llama_print_timings: load time = 459.67 ms
llama_print_timings: sample time = 251.73 ms / 500 runs ( 0.50 ms per token, 1986.24 tokens per second)
llama_print_timings: prompt eval time = 10175.15 ms / 68 tokens ( 149.63 ms per token, 6.68 tokens per second)