@@ -22,6 +22,9 @@ Specifies the number of layers offloaded into the GPU.
22
22
. PARAMETER modelContextLength
23
23
Specifies the context length the model was trained on.
24
24
25
+ . PARAMETER verbose
26
+ Increases the verbosity of the llama.cpp server.
27
+
25
28
. EXAMPLE
26
29
.\server.ps1 -model "..\vendor\llama.cpp\models\openchat-3.5-0106.Q5_K_M.gguf"
27
30
@@ -33,6 +36,9 @@ Specifies the models context length it was trained on.
33
36
34
37
. EXAMPLE
35
38
.\server.ps1 -model "C:\models\openchat-3.5-0106.Q5_K_M.gguf" -port 8081
39
+
40
+ . EXAMPLE
41
+ .\server.ps1 -model "..\vendor\llama.cpp\models\openchat-3.5-0106.Q5_K_M.gguf" -verbose
36
42
#>
37
43
38
44
Param (
@@ -75,6 +81,9 @@ Param (
75
81
$modelContextLength = -1
76
82
)
77
83
84
+ # -Verbose is a PowerShell common parameter; check the bound parameters to see whether it was passed.
85
+ $verbose = $PSCmdlet.MyInvocation.BoundParameters [" Verbose" ].IsPresent -eq $true
86
+
78
87
# We are resolving the absolute path to the llama.cpp project directory.
79
88
$llamaCppPath = Resolve-Path - Path " ${PSScriptRoot} \..\vendor\llama.cpp"
80
89
@@ -251,16 +260,7 @@ Start-Job -Name 'BrowserJob' -ScriptBlock {
251
260
252
261
Write-Host " Starting llama.cpp server with custom options..." - ForegroundColor " Yellow"
253
262
254
- [PSCustomObject ]@ {
255
- " Context Size" = $contextSize
256
- " Group Attention Factor" = $groupAttentionFactor
257
- " Group Attention Width" = $groupAttentionWidth
258
- " Physical CPU Cores" = $numberOfPhysicalCores
259
- " GPU Layers" = " ${numberOfGPULayers} /${maximumNumberOfLayers} "
260
- " Parallel Slots" = " ${parallel} "
261
- } | Format-List | Out-String | ForEach-Object { $_.Trim (" `r " , " `n " ) }
262
-
263
- Invoke-Expression " ${llamaCppPath} \build\bin\Release\server ``
263
+ $command = " ${llamaCppPath} \build\bin\Release\server ``
264
264
--n-predict 1024 ``
265
265
--log-disable ``
266
266
--port '${port} ' ``
@@ -272,4 +272,9 @@ Invoke-Expression "${llamaCppPath}\build\bin\Release\server ``
272
272
--parallel '${parallel} ' ``
273
273
--grp-attn-n '${groupAttentionFactor} ' ``
274
274
--grp-attn-w '${groupAttentionWidth} ' ``
275
- $ ( if ($enableFlashAttention ) {" --flash-attn" }) "
275
+ $ ( if ($enableFlashAttention ) {" --flash-attn" }) ``
276
+ $ ( if ($verbose ) {" --verbose" }) "
277
+
278
+ Write-Host $command - ForegroundColor " Green"
279
+
280
+ Invoke-Expression $command
0 commit comments