Skip to content

Commit ac1ae60

Browse files
committed
models(gallery): add hermes-2-theta-llama-3-70b
Signed-off-by: Ettore Di Giacinto <[email protected]>
1 parent 70a2bfe commit ac1ae60

File tree

2 files changed

+36
-34
lines changed

2 files changed

+36
-34
lines changed

gallery/hermes-2-pro-mistral.yaml

Lines changed: 13 additions & 34 deletions
Original file line numberDiff line numberDiff line change
@@ -7,47 +7,26 @@ config_file: |
77
stopwords:
88
- "<|im_end|>"
99
- "<dummy32000>"
10-
- "</tool_call>"
1110
- "<|eot_id|>"
1211
- "<|end_of_text|>"
1312
function:
14-
# disable injecting the "answer" tool
1513
disable_no_action: true
16-
17-
grammar:
18-
# This allows the grammar to also return messages
19-
mixed_mode: true
20-
2114
return_name_in_function_response: true
22-
# Without grammar uncomment the lines below
23-
# Warning: this is relying only on the capability of the
24-
# LLM model to generate the correct function call.
15+
grammar:
16+
# Uncomment the line below to enable grammar matching for JSON results if the model is breaking
17+
# the output. This will make the model more accurate and won't break the JSON output.
18+
# This, however, will make parallel_calls non-functional (it is a known bug).
19+
# mixed_mode: true
20+
parallel_calls: true
21+
expect_strings_after_json: true
2522
json_regex_match:
2623
- "(?s)<tool_call>(.*?)</tool_call>"
27-
- "(?s)<tool_call>(.*?)"
24+
- "(?s)<tool_call>(.*)"
25+
capture_llm_results:
26+
- (?s)<scratchpad>(.*?)</scratchpad>
2827
replace_llm_results:
29-
# Drop the scratchpad content from responses
30-
- key: "(?s)<scratchpad>.*</scratchpad>"
31-
value: ""
32-
replace_function_results:
33-
# Replace everything that is not JSON array or object
34-
- key: '(?s)^[^{\[]*'
35-
value: ""
36-
- key: '(?s)[^}\]]*$'
37-
value: ""
38-
- key: "'([^']*?)'"
39-
value: "_DQUOTE_${1}_DQUOTE_"
40-
- key: '\\"'
41-
value: "__TEMP_QUOTE__"
42-
- key: "\'"
43-
value: "'"
44-
- key: "_DQUOTE_"
45-
value: '"'
46-
- key: "__TEMP_QUOTE__"
47-
value: '"'
48-
# Drop the scratchpad content from responses
49-
- key: "(?s)<scratchpad>.*</scratchpad>"
50-
value: ""
28+
- key: (?s)<scratchpad>(.*?)</scratchpad>
29+
value: ""
5130
5231
template:
5332
chat: |
@@ -73,7 +52,7 @@ config_file: |
7352
{{- end }}<|im_end|>
7453
completion: |
7554
{{.Input}}
76-
function: |-
55+
function: |
7756
<|im_start|>system
7857
You are a function calling AI model.
7958
Here are the available tools:

gallery/index.yaml

Lines changed: 23 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2325,6 +2325,29 @@
23252325
- filename: "Hermes-2-Pro-Llama-3-Instruct-Merged-DPO-Q4_K_M.gguf"
23262326
sha256: "762b9371a296ab2628592b9462dc676b27d881a3402816492801641a437669b3"
23272327
uri: "huggingface://NousResearch/Hermes-2-Theta-Llama-3-8B-GGUF/Hermes-2-Pro-Llama-3-Instruct-Merged-DPO-Q4_K_M.gguf"
2328+
- !!merge <<: *hermes-2-pro-mistral
2329+
name: "hermes-2-theta-llama-3-70b"
2330+
icon: https://cdn-uploads.huggingface.co/production/uploads/6317aade83d8d2fd903192d9/P4NxBFwfBbboNZVytpn45.png
2331+
tags:
2332+
- llm
2333+
- gguf
2334+
- gpu
2335+
- llama3
2336+
- cpu
2337+
- function-calling
2338+
description: |
2339+
Hermes-2 Θ (Theta) 70B is the continuation of our experimental merged model released by Nous Research, in collaboration with Charles Goddard and Arcee AI, the team behind MergeKit.
2340+
2341+
Hermes-2 Θ is a merged and then further RLHF'ed version of our excellent Hermes 2 Pro model and Meta's Llama-3 Instruct model to form a new model, Hermes-2 Θ, combining the best of both worlds of each model.
2342+
urls:
2343+
- https://huggingface.co/NousResearch/Hermes-2-Theta-Llama-3-70B-GGUF
2344+
overrides:
2345+
parameters:
2346+
model: Hermes-2-Theta-Llama-3-70B-Q4_K_M.gguf
2347+
files:
2348+
- filename: "Hermes-2-Theta-Llama-3-70B-Q4_K_M.gguf"
2349+
sha256: "b3965f671c35d09da8b903218f5bbaac94efdd9000e4fe4a2bac87fcac9f664e"
2350+
uri: "huggingface://NousResearch/Hermes-2-Theta-Llama-3-70B-GGUF/Hermes-2-Theta-Llama-3-70B-Q4_K_M.gguf"
23282351
### LLAMA3 version
23292352
- !!merge <<: *hermes-2-pro-mistral
23302353
name: "hermes-2-pro-llama-3-8b"

0 commit comments

Comments
 (0)