diff --git a/config.properties b/config.properties index a537361..31f303a 100644 --- a/config.properties +++ b/config.properties @@ -1,5 +1,5 @@ #Llama Runner Configuration -#Sun Mar 29 16:13:49 CEST 2026 +#Sun Mar 29 17:31:07 CEST 2026 windowHeight=1189 windowWidth=711 windowX=1849 diff --git a/profiles.json b/profiles.json index ecb6717..95dc982 100644 --- a/profiles.json +++ b/profiles.json @@ -6,8 +6,8 @@ "threads": 99, "flashAttention": true, "kvUnified": true, - "cacheTypeK": "q8_0", - "cacheTypeV": "q8_0", + "cacheTypeK": "turbo3", + "cacheTypeV": "turbo3", "temperature": 0.6, "topP": 0.95, "topK": 20, @@ -27,8 +27,8 @@ "threads": 99, "flashAttention": true, "kvUnified": true, - "cacheTypeK": "q8_0", - "cacheTypeV": "q8_0", + "cacheTypeK": "turbo3", + "cacheTypeV": "turbo3", "temperature": 0.6, "topP": 0.95, "topK": 20, @@ -48,8 +48,8 @@ "threads": 99, "flashAttention": true, "kvUnified": true, - "cacheTypeK": "q8_0", - "cacheTypeV": "q8_0", + "cacheTypeK": "turbo3", + "cacheTypeV": "turbo3", "temperature": 0.6, "topP": 0.95, "topK": 20, @@ -69,8 +69,8 @@ "threads": 99, "flashAttention": true, "kvUnified": true, - "cacheTypeK": "q8_0", - "cacheTypeV": "q8_0", + "cacheTypeK": "turbo3", + "cacheTypeV": "turbo3", "temperature": 0.6, "topP": 0.95, "topK": 20, @@ -90,8 +90,8 @@ "threads": 99, "flashAttention": true, "kvUnified": true, - "cacheTypeK": "q8_0", - "cacheTypeV": "q8_0", + "cacheTypeK": "turbo3", + "cacheTypeV": "turbo3", "temperature": 0.6, "topP": 0.95, "topK": 20, @@ -132,8 +132,8 @@ "threads": 99, "flashAttention": true, "kvUnified": true, - "cacheTypeK": "q8_0", - "cacheTypeV": "q8_0", + "cacheTypeK": "turbo3", + "cacheTypeV": "turbo3", "temperature": 0.6, "topP": 0.95, "topK": 20, @@ -153,8 +153,8 @@ "threads": 99, "flashAttention": true, "kvUnified": true, - "cacheTypeK": "q8_0", - "cacheTypeV": "q8_0", + "cacheTypeK": "turbo3", + "cacheTypeV": "turbo3", "temperature": 0.6, "topP": 0.95, "topK": 20, @@ -174,8 +174,8 @@ "threads": 99, "flashAttention": true, "kvUnified": true, - "cacheTypeK": "q8_0", - "cacheTypeV": "q8_0", + "cacheTypeK": "turbo3", + "cacheTypeV": "turbo3", "temperature": 0.6, "topP": 0.95, "topK": 20, @@ -195,8 +195,8 @@ "threads": 99, "flashAttention": true, "kvUnified": true, - "cacheTypeK": "q8_0", - "cacheTypeV": "q8_0", + "cacheTypeK": "turbo3", + "cacheTypeV": "turbo3", "temperature": 0.6, "topP": 0.95, "topK": 20, @@ -216,8 +216,8 @@ "threads": 99, "flashAttention": true, "kvUnified": true, - "cacheTypeK": "q8_0", - "cacheTypeV": "q8_0", + "cacheTypeK": "turbo3", + "cacheTypeV": "turbo3", "temperature": 0.6, "topP": 0.95, "topK": 20, diff --git a/src/main/java/cz/kamma/llamarunner/Main.java b/src/main/java/cz/kamma/llamarunner/Main.java index 35fc625..920b5a2 100644 --- a/src/main/java/cz/kamma/llamarunner/Main.java +++ b/src/main/java/cz/kamma/llamarunner/Main.java @@ -773,7 +773,7 @@ public class Main extends JFrame { gbc.gridx = 1; gbc.weightx = 1.0; - cacheTypeKComboBox = new JComboBox<>(new String[] { "bf16", "f16", "f32", "f8", "q8_0" }); + cacheTypeKComboBox = new JComboBox<>(new String[] { "bf16", "f16", "f32", "f8", "q8_0", "turbo3", "turbo4" }); cacheTypeKComboBox.setSelectedIndex(0); cacheTypeKComboBox.addActionListener(e -> updateCommandPreview()); panel.add(cacheTypeKComboBox, gbc); @@ -785,7 +785,7 @@ public class Main extends JFrame { gbc.gridx = 1; gbc.weightx = 1.0; - cacheTypeVComboBox = new JComboBox<>(new String[] { "bf16", "f16", "f32", "f8", "q8_0" }); + cacheTypeVComboBox = new JComboBox<>(new String[] { "bf16", "f16", "f32", "f8", "q8_0", "turbo3", "turbo4" }); cacheTypeVComboBox.setSelectedIndex(0); cacheTypeVComboBox.addActionListener(e -> updateCommandPreview()); panel.add(cacheTypeVComboBox, gbc);