Add mistral 7b example

countzero · countzero · commit b1897ef28712 · 2023-09-28T11:55:00.000+02:00
diff --git a/examples/server_fashiongpt_70b_v1.1.ps1 b/examples/server_fashiongpt_70b_v1.1.ps1
@@ -0,0 +1,7 @@
+Start-Process "http://127.0.0.1:8080"
+
+../vendor/llama.cpp/build/bin/Release/server `
+    --model "../vendor/llama.cpp/models/FashionGPT-70B-V1.1/model-quantized-q4_K_M.gguf" `
+    --ctx-size 4096 `
+    --threads 16 `
+    --n-gpu-layers 10
diff --git a/examples/server_mistral_7b_v0.1.ps1 b/examples/server_mistral_7b_v0.1.ps1
@@ -0,0 +1,7 @@
+Start-Process "http://127.0.0.1:8080"
+
+../vendor/llama.cpp/build/bin/Release/server `
+    --model "../vendor/llama.cpp/models/Mistral-7B-v0.1/model-quantized-q4_K_M.gguf" `
+    --ctx-size 4096 `
+    --threads 16 `
+    --n-gpu-layers 35
diff --git a/examples/server_phind_codellama_34b_v2_32K.ps1 b/examples/server_phind_codellama_34b_v2_32K.ps1
@@ -8,7 +8,7 @@ Start-Process "http://127.0.0.1:8080"
 #
 ../vendor/llama.cpp/build/bin/Release/server `
     --model "../vendor/llama.cpp/models/Phind-CodeLlama-34B-v2/model-quantized-q4_K_M.gguf" `
-    --ctx-size 16384 `
+    --ctx-size 32768 `
     --rope-freq-scale 0.125 `
     --rope-freq-base 80000 `
     --threads 16 `
diff --git a/examples/server_wizardcoder_15b_v1.0.ps1 b/examples/server_wizardcoder_15b_v1.0.ps1
@@ -4,5 +4,5 @@ Start-Process "http://127.0.0.1:8080"
 ../vendor/llama.cpp/build/bin/Release/server `
     --model "../vendor/llama.cpp/models/WizardCoder-15B-V1.0/model-quantized-q4_k_M.gguf" `
     --ctx-size 2048 `
-    --threads 6 `
+    --threads 16 `
     --n-gpu-layers 0
diff --git a/vendor/llama.cpp b/vendor/llama.cpp
@@ -1 +1 @@
-Subproject commit a40f2b656fab364ce0aff98dbefe9bd9c3721cc9
+Subproject commit 20c7e1e804690f3db58bd33eb56f8c6aa4735c63

Original file line number	Diff line number	Diff line change
`@@ -8,7 +8,7 @@ Start-Process "http://127.0.0.1:8080"`
`8`	`8`	`#`
`9`	`9`	../vendor/llama.cpp/build/bin/Release/server `
`10`	`10`	--model "../vendor/llama.cpp/models/Phind-CodeLlama-34B-v2/model-quantized-q4_K_M.gguf" `
`11`		- --ctx-size 16384 `
	`11`	+ --ctx-size 32768 `
`12`	`12`	--rope-freq-scale 0.125 `
`13`	`13`	--rope-freq-base 80000 `
`14`	`14`	--threads 16 `