
@rajivmehtaflex
Created May 28, 2024 05:05
LLM Execution server (.args file contents):
--model
/workspace/codesandbox-template-blank/llamafile/AutoCoder_S_6.gguf
--server
--host
0.0.0.0
-ngl
100
...
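The .args file lists one argument per line; llamafile reads it as the default command line, and the trailing `...` line allows extra arguments passed at runtime to be appended. A minimal sketch that generates the file shown above (the model path is the one from this gist; adjust for your setup):

```python
# Write the .args file for the llamafile server.
# One argument per line; "..." lets runtime CLI args pass through.
ARGS = """\
--model
/workspace/codesandbox-template-blank/llamafile/AutoCoder_S_6.gguf
--server
--host
0.0.0.0
-ngl
100
...
"""

with open(".args", "w") as f:
    f.write(ARGS)
```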
Test gguf file
- Download llamafile
- Download/Create gguf file
./llamafile -m ./AutoCoder_S_6.gguf --server --port 8889 --temp 0.3
Create standalone llm server
- Create .args file
- Compile to server
cp llamafile AutoCoder.llamafile
./zipalign -j0 AutoCoder.llamafile AutoCoder_S_6.gguf .args
./AutoCoder.llamafile
./AutoCoder.llamafile --port 8890
curl http://localhost:8080/v1/chat/completions \
  -H "Content-Type: application/json" -d '{
    "model": "/workspace/codesandbox-template-blank/llamafile/AutoCoder_S_6.gguf",
    "stream": true,
    "messages": [
      {
        "role": "system",
        "content": "You are a poetic assistant."
      },
      {
        "role": "user",
        "content": "Compose a poem that explains FORTRAN."
      }
    ]
  }'
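The same OpenAI-compatible endpoint can be called from Python. A minimal sketch using only the standard library, assuming the server is on the default port 8080 (change `host` to match your `--port`); it sends a non-streaming request for simplicity, unlike the curl example's `"stream": true`:

```python
import json
import urllib.request

def build_payload(prompt: str) -> dict:
    """Build the same request body as the curl example above."""
    return {
        "model": "/workspace/codesandbox-template-blank/llamafile/AutoCoder_S_6.gguf",
        "stream": False,  # non-streaming for a simple one-shot reply
        "messages": [
            {"role": "system", "content": "You are a poetic assistant."},
            {"role": "user", "content": prompt},
        ],
    }

def chat(prompt: str, host: str = "http://localhost:8080") -> str:
    req = urllib.request.Request(
        f"{host}/v1/chat/completions",
        data=json.dumps(build_payload(prompt)).encode(),
        headers={"Content-Type": "application/json"},
    )
    with urllib.request.urlopen(req) as resp:
        body = json.load(resp)
    # Standard OpenAI-style response shape
    return body["choices"][0]["message"]["content"]

if __name__ == "__main__":
    print(chat("Compose a poem that explains FORTRAN."))
```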