Skip to content

Commit 4e5b280

Browse files
committed
feat: add latest qwen 2.5 coder models and adjust stop tokens
1 parent 3670fdf commit 4e5b280

File tree

3 files changed

+53
-6
lines changed

3 files changed

+53
-6
lines changed

src/main/java/ee/carlrobert/codegpt/completions/HuggingFaceModel.java

Lines changed: 24 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -125,12 +125,33 @@ public enum HuggingFaceModel {
125125
CODE_QWEN_2_5_1_5B_Q8_0(1, 8, "Qwen2.5-Coder-1.5B-Instruct-GGUF",
126126
"qwen2.5-coder-1.5b-instruct-q8_0.gguf", "Qwen", 1.89),
127127

128+
CODE_QWEN_2_5_3B_Q4_K_M(3, 4, "Qwen2.5-Coder-3B-Instruct-GGUF",
129+
"qwen2.5-coder-3b-instruct-q4_k_m.gguf", "Qwen", 2.10),
130+
CODE_QWEN_2_5_3B_Q6_K(3, 6, "Qwen2.5-Coder-3B-Instruct-GGUF",
131+
"qwen2.5-coder-3b-instruct-q6_k.gguf", "Qwen", 2.79),
132+
CODE_QWEN_2_5_3B_Q8_0(3, 8, "Qwen2.5-Coder-3B-Instruct-GGUF",
133+
"qwen2.5-coder-3b-instruct-q8_0.gguf", "Qwen", 3.62),
134+
128135
CODE_QWEN_2_5_7B_Q4_K_M(7, 4, "Qwen2.5-Coder-7B-Instruct-GGUF",
129-
"Qwen2.5-Coder-7B-Instruct-Q4_K_M.gguf", "bartowski", 4.68),
136+
"qwen2.5-coder-7b-instruct-q4_k_m.gguf", "Qwen", 4.68),
130137
CODE_QWEN_2_5_7B_Q6_K(7, 6, "Qwen2.5-Coder-7B-Instruct-GGUF",
131-
"Qwen2.5-Coder-7B-Instruct-Q6_K.gguf", "bartowski", 6.25),
138+
"qwen2.5-coder-7b-instruct-q6_k.gguf", "Qwen", 6.25),
132139
CODE_QWEN_2_5_7B_Q8_0(7, 8, "Qwen2.5-Coder-7B-Instruct-GGUF",
133-
"Qwen2.5-Coder-7B-Instruct-Q8_0.gguf", "bartowski", 8.1),
140+
"qwen2.5-coder-7b-instruct-q8_0.gguf", "Qwen", 8.10),
141+
142+
CODE_QWEN_2_5_14B_Q4_K_M(14, 4, "Qwen2.5-Coder-14B-Instruct-GGUF",
143+
"qwen2.5-coder-14b-instruct-q4_k_m.gguf", "Qwen", 8.99),
144+
CODE_QWEN_2_5_14B_Q6_K(14, 6, "Qwen2.5-Coder-14B-Instruct-GGUF",
145+
"qwen2.5-coder-14b-instruct-q6_k.gguf", "Qwen", 12.10),
146+
CODE_QWEN_2_5_14B_Q8_0(14, 8, "Qwen2.5-Coder-14B-Instruct-GGUF",
147+
"qwen2.5-coder-14b-instruct-q8_0.gguf", "Qwen", 15.70),
148+
149+
CODE_QWEN_2_5_32B_Q4_K_M(32, 4, "Qwen2.5-Coder-32B-Instruct-GGUF",
150+
"qwen2.5-coder-32b-instruct-q4_k_m.gguf", "Qwen", 19.90),
151+
CODE_QWEN_2_5_32B_Q6_K(32, 6, "Qwen2.5-Coder-32B-Instruct-GGUF",
152+
"qwen2.5-coder-32b-instruct-q6_k.gguf", "Qwen", 26.90),
153+
CODE_QWEN_2_5_32B_Q8_0(32, 8, "Qwen2.5-Coder-32B-Instruct-GGUF",
154+
"qwen2.5-coder-32b-instruct-q8_0.gguf", "Qwen", 34.80),
134155

135156
STABLE_CODE_3B_Q3_K_M(SC3, 3, "stable-code-instruct-3b-Q3_K_M.gguf", 1.39),
136157
STABLE_CODE_3B_Q4_K_M(SC3, 4, "stable-code-instruct-3b-Q4_K_M.gguf", 1.71),

src/main/java/ee/carlrobert/codegpt/completions/llama/LlamaModel.java

Lines changed: 10 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -189,9 +189,18 @@ public enum LlamaModel {
189189
List.of(
190190
HuggingFaceModel.CODE_QWEN_2_5_1_5B_Q6_K,
191191
HuggingFaceModel.CODE_QWEN_2_5_1_5B_Q8_0,
192+
HuggingFaceModel.CODE_QWEN_2_5_3B_Q4_K_M,
193+
HuggingFaceModel.CODE_QWEN_2_5_3B_Q6_K,
194+
HuggingFaceModel.CODE_QWEN_2_5_3B_Q8_0,
192195
HuggingFaceModel.CODE_QWEN_2_5_7B_Q4_K_M,
193196
HuggingFaceModel.CODE_QWEN_2_5_7B_Q6_K,
194-
HuggingFaceModel.CODE_QWEN_2_5_7B_Q8_0)),
197+
HuggingFaceModel.CODE_QWEN_2_5_7B_Q8_0,
198+
HuggingFaceModel.CODE_QWEN_2_5_14B_Q4_K_M,
199+
HuggingFaceModel.CODE_QWEN_2_5_14B_Q6_K,
200+
HuggingFaceModel.CODE_QWEN_2_5_14B_Q8_0,
201+
HuggingFaceModel.CODE_QWEN_2_5_32B_Q4_K_M,
202+
HuggingFaceModel.CODE_QWEN_2_5_32B_Q6_K,
203+
HuggingFaceModel.CODE_QWEN_2_5_32B_Q8_0)),
195204
STABLE_CODE(
196205
"Stable Code Instruct", """
197206
stable-code-instruct-3b is a 2.7B billion parameter decoder-only language model tuned from \

src/main/kotlin/ee/carlrobert/codegpt/codecompletions/InfillPromptTemplate.kt

Lines changed: 19 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -50,7 +50,23 @@ enum class InfillPromptTemplate(val label: String, val stopTokens: List<String>?
5050
}
5151
}
5252
},
53-
CODE_QWEN_2_5("CodeQwen2.5", listOf()) {
53+
CODE_QWEN_2_5(
54+
"CodeQwen2.5",
55+
listOf(
56+
"package ",
57+
"import ",
58+
"<|endoftext|>",
59+
"<|fim_prefix|>",
60+
"<|fim_middle|>",
61+
"<|fim_suffix|>",
62+
"<|fim_pad|>",
63+
"<|cursor|>",
64+
"<|repo_name|>",
65+
"<|file_sep|>",
66+
"<|im_start|>",
67+
"<|im_end|>"
68+
)
69+
) {
5470
override fun buildPrompt(infillDetails: InfillRequest): String {
5571
val infillPrompt =
5672
"<|fim_prefix|> ${infillDetails.prefix} <|fim_suffix|>${infillDetails.suffix} <|fim_middle|>"
@@ -110,7 +126,8 @@ enum class InfillPromptTemplate(val label: String, val stopTokens: List<String>?
110126
CODESTRAL("Codestral", listOf("</s>")) {
111127
override fun buildPrompt(infillDetails: InfillRequest): String {
112128
// see https://github.com/mistralai/mistral-common/blob/master/src/mistral_common/tokens/tokenizers/base.py
113-
val infillPrompt = "[SUFFIX]${infillDetails.suffix}[PREFIX]${infillDetails.prefix}[MIDDLE]"
129+
val infillPrompt =
130+
"[SUFFIX]${infillDetails.suffix}[PREFIX]${infillDetails.prefix}[MIDDLE]"
114131
return createDefaultMultiFilePrompt(infillDetails, infillPrompt)
115132
}
116133
};

0 commit comments

Comments
 (0)