Skip to content
Snippets Groups Projects
Commit 93958d28 authored by Fabian Rybinski's avatar Fabian Rybinski
Browse files

Add new file

parent 46812071
No related branches found
No related tags found
No related merge requests found
---
# LocalAI model-gallery entry for the fine-tuned AIE Gemma 2 2B IT model
# (Q4_K_M GGUF build).
#
# NOTE(review): the original indentation of this file was lost; the nesting
# below is reconstructed from the LocalAI gallery / model-config layout
# (runtime settings, including `usage`, live inside `config_file`; `files`
# is a top-level key). Confirm against the deployed gallery.
name: "aie-gemma-finetuned"
description: |
  This is a model which is currently tested.

# `config_file` is a literal block holding the model configuration as text.
# - `parameters.model` must stay identical to `files[].filename` below.
# - The `usage` example addresses this model by its own name and passes
#   `temperature` as a top-level request field (it was previously nested
#   inside the message object, where the chat-completions schema does not
#   read it).
config_file: |
  name: aie-gemma-finetuned
  mmap: true
  backend: llama
  f16: true
  gpu_layers: 35
  threads: 12
  parameters:
    model: downloads/llama_backend/AIE_Gemma2_2B_IT_Q4_K_M.gguf
  roles:
    assistant: 'Assistant:'
    system: 'System:'
    user: 'User:'
  template:
    chat_message: |-
      <start_of_turn>{{if eq .RoleName "assistant" }}model{{else}}{{ .RoleName }}{{end}}
      {{ if .Content -}}
      {{.Content -}}
      {{ end -}}<end_of_turn>
    chat: |
      {{.Input }}
      <start_of_turn>model
    completion: |
      {{.Input}}
  stopwords:
    - '<|im_end|>'
    - '<end_of_turn>'
    - '<start_of_turn>'
  context_size: 4096
  usage: |
    curl http://localhost:8080/v1/chat/completions -H "Content-Type: application/json" -d '{
      "model": "aie-gemma-finetuned",
      "temperature": 0.1,
      "messages": [{"role": "user", "content": "How are you doing?"}]
    }'

# Files fetched when the model is installed.
files:
  - filename: "downloads/llama_backend/AIE_Gemma2_2B_IT_Q4_K_M.gguf"
    # TODO(review): fill in the SHA-256 of the GGUF file; with an empty
    # value the download presumably cannot be integrity-checked.
    sha256: ""
    # Use the Hub's `/resolve/` endpoint: `/blob/` serves the HTML viewer
    # page, not the model file itself.
    uri: "https://huggingface.co/Phabby/AIE-Gemma-2-2B-IT/resolve/main/AIE_Gemma2_2B_IT_Q4_K_M.gguf"
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment