profiles changed
This commit is contained in:
parent
d1358cc6d3
commit
1f297a41a7
@ -1,5 +1,5 @@
|
|||||||
#Llama Runner Configuration
|
#Llama Runner Configuration
|
||||||
#Sun Mar 29 17:54:05 CEST 2026
|
#Thu Apr 02 10:20:00 CEST 2026
|
||||||
windowHeight=1189
|
windowHeight=1189
|
||||||
windowWidth=711
|
windowWidth=711
|
||||||
windowX=1849
|
windowX=1849
|
||||||
|
|||||||
@ -3,6 +3,7 @@
|
|||||||
"host": "0.0.0.0",
|
"host": "0.0.0.0",
|
||||||
"port": 3080,
|
"port": 3080,
|
||||||
"parallel": 1,
|
"parallel": 1,
|
||||||
|
"batchSize": 2048,
|
||||||
"threads": 99,
|
"threads": 99,
|
||||||
"flashAttention": true,
|
"flashAttention": true,
|
||||||
"kvUnified": true,
|
"kvUnified": true,
|
||||||
@ -24,6 +25,7 @@
|
|||||||
"host": "0.0.0.0",
|
"host": "0.0.0.0",
|
||||||
"port": 3080,
|
"port": 3080,
|
||||||
"parallel": 1,
|
"parallel": 1,
|
||||||
|
"batchSize": 2048,
|
||||||
"threads": 99,
|
"threads": 99,
|
||||||
"flashAttention": true,
|
"flashAttention": true,
|
||||||
"kvUnified": true,
|
"kvUnified": true,
|
||||||
@ -45,6 +47,7 @@
|
|||||||
"host": "0.0.0.0",
|
"host": "0.0.0.0",
|
||||||
"port": 3080,
|
"port": 3080,
|
||||||
"parallel": 1,
|
"parallel": 1,
|
||||||
|
"batchSize": 2048,
|
||||||
"threads": 99,
|
"threads": 99,
|
||||||
"flashAttention": true,
|
"flashAttention": true,
|
||||||
"kvUnified": true,
|
"kvUnified": true,
|
||||||
@ -66,6 +69,7 @@
|
|||||||
"host": "0.0.0.0",
|
"host": "0.0.0.0",
|
||||||
"port": 3080,
|
"port": 3080,
|
||||||
"parallel": 1,
|
"parallel": 1,
|
||||||
|
"batchSize": 2048,
|
||||||
"threads": 99,
|
"threads": 99,
|
||||||
"flashAttention": true,
|
"flashAttention": true,
|
||||||
"kvUnified": true,
|
"kvUnified": true,
|
||||||
@ -87,6 +91,7 @@
|
|||||||
"host": "0.0.0.0",
|
"host": "0.0.0.0",
|
||||||
"port": 3080,
|
"port": 3080,
|
||||||
"parallel": 1,
|
"parallel": 1,
|
||||||
|
"batchSize": 2048,
|
||||||
"threads": 99,
|
"threads": 99,
|
||||||
"flashAttention": true,
|
"flashAttention": true,
|
||||||
"kvUnified": true,
|
"kvUnified": true,
|
||||||
@ -108,6 +113,7 @@
|
|||||||
"host": "0.0.0.0",
|
"host": "0.0.0.0",
|
||||||
"port": 3080,
|
"port": 3080,
|
||||||
"parallel": 1,
|
"parallel": 1,
|
||||||
|
"batchSize": 2048,
|
||||||
"threads": 99,
|
"threads": 99,
|
||||||
"flashAttention": true,
|
"flashAttention": true,
|
||||||
"kvUnified": true,
|
"kvUnified": true,
|
||||||
@ -129,6 +135,7 @@
|
|||||||
"host": "0.0.0.0",
|
"host": "0.0.0.0",
|
||||||
"port": 3080,
|
"port": 3080,
|
||||||
"parallel": 1,
|
"parallel": 1,
|
||||||
|
"batchSize": 2048,
|
||||||
"threads": 99,
|
"threads": 99,
|
||||||
"flashAttention": true,
|
"flashAttention": true,
|
||||||
"kvUnified": true,
|
"kvUnified": true,
|
||||||
@ -150,6 +157,7 @@
|
|||||||
"host": "0.0.0.0",
|
"host": "0.0.0.0",
|
||||||
"port": 3080,
|
"port": 3080,
|
||||||
"parallel": 1,
|
"parallel": 1,
|
||||||
|
"batchSize": 2048,
|
||||||
"threads": 99,
|
"threads": 99,
|
||||||
"flashAttention": true,
|
"flashAttention": true,
|
||||||
"kvUnified": true,
|
"kvUnified": true,
|
||||||
@ -171,6 +179,7 @@
|
|||||||
"host": "0.0.0.0",
|
"host": "0.0.0.0",
|
||||||
"port": 3080,
|
"port": 3080,
|
||||||
"parallel": 1,
|
"parallel": 1,
|
||||||
|
"batchSize": 2048,
|
||||||
"threads": 99,
|
"threads": 99,
|
||||||
"flashAttention": true,
|
"flashAttention": true,
|
||||||
"kvUnified": true,
|
"kvUnified": true,
|
||||||
@ -192,6 +201,7 @@
|
|||||||
"host": "0.0.0.0",
|
"host": "0.0.0.0",
|
||||||
"port": 3080,
|
"port": 3080,
|
||||||
"parallel": 1,
|
"parallel": 1,
|
||||||
|
"batchSize": 2048,
|
||||||
"threads": 99,
|
"threads": 99,
|
||||||
"flashAttention": true,
|
"flashAttention": true,
|
||||||
"kvUnified": true,
|
"kvUnified": true,
|
||||||
@ -213,6 +223,7 @@
|
|||||||
"host": "0.0.0.0",
|
"host": "0.0.0.0",
|
||||||
"port": 3080,
|
"port": 3080,
|
||||||
"parallel": 1,
|
"parallel": 1,
|
||||||
|
"batchSize": 2048,
|
||||||
"threads": 99,
|
"threads": 99,
|
||||||
"flashAttention": true,
|
"flashAttention": true,
|
||||||
"kvUnified": true,
|
"kvUnified": true,
|
||||||
@ -229,5 +240,27 @@
|
|||||||
"ngl": -1,
|
"ngl": -1,
|
||||||
"fit": true,
|
"fit": true,
|
||||||
"reasoning": true
|
"reasoning": true
|
||||||
|
},
|
||||||
|
"Qwen35-35B-A3B-Q6K-turbo4-256k": {
|
||||||
|
"host": "0.0.0.0",
|
||||||
|
"port": 3080,
|
||||||
|
"parallel": 1,
|
||||||
|
"batchSize": 2048,
|
||||||
|
"threads": 99,
|
||||||
|
"flashAttention": true,
|
||||||
|
"kvUnified": true,
|
||||||
|
"cacheTypeK": "turbo4",
|
||||||
|
"cacheTypeV": "turbo4",
|
||||||
|
"temperature": 0.6,
|
||||||
|
"topP": 0.95,
|
||||||
|
"topK": 20,
|
||||||
|
"minP": 0.0,
|
||||||
|
"ctxSize": 256000,
|
||||||
|
"enableThinking": false,
|
||||||
|
"modelPath": "/home/kamma/models/Qwen3.5-35B-A3B-Q6_K.gguf",
|
||||||
|
"chatTemplateKwargs": "{\"enable_thinking\": true}",
|
||||||
|
"ngl": 999,
|
||||||
|
"fit": true,
|
||||||
|
"reasoning": true
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
Loading…
x
Reference in New Issue
Block a user