From 93958d28220fc18a9d136e97530afdbfff38c395 Mon Sep 17 00:00:00 2001
From: Fabian Rybinski <fabian.rybinski@kit.edu>
Date: Wed, 20 Nov 2024 08:30:46 +0000
Subject: [PATCH] Add aie-gemma-finetuned.yaml model definition

---
 aie-gemma-finetuned.yaml | 44 ++++++++++++++++++++++++++++++++++++++++
 1 file changed, 44 insertions(+)
 create mode 100644 aie-gemma-finetuned.yaml

diff --git a/aie-gemma-finetuned.yaml b/aie-gemma-finetuned.yaml
new file mode 100644
index 0000000..ca2209d
--- /dev/null
+++ b/aie-gemma-finetuned.yaml
@@ -0,0 +1,44 @@
+name: "aie-gemma-finetuned"  # same identifier as the `name` inside config_file
+
+description: |
+  This is a model which is currently being tested.
+config_file: |  # model config embedded as a literal block; the lines below are its own YAML
+  name: aie-gemma-finetuned
+  mmap: true
+  backend: llama
+  f16: true
+  gpu_layers: 35
+  threads: 12
+  parameters:
+    model: downloads/llama_backend/AIE_Gemma2_2B_IT_Q4_K_M.gguf  # same path as files[].filename
+  roles:
+    assistant: 'Assistant:'
+    system: 'System:'
+    user: 'User:'
+  template:
+    chat_message: |-  # emits "model" for the assistant role, the role name otherwise
+      <start_of_turn>{{if eq .RoleName "assistant" }}model{{else}}{{ .RoleName }}{{end}}
+      {{ if .Content -}}
+      {{.Content -}}
+      {{ end -}}<end_of_turn>
+    chat: |
+      {{.Input }}
+      <start_of_turn>model
+    completion: |
+      {{.Input}}
+  stopwords:
+  - '<|im_end|>'  # NOTE(review): not emitted by the templates above - confirm it is needed
+  - '<end_of_turn>'
+  - '<start_of_turn>'
+  context_size: 4096
+
+
+  usage: |  # sample request addressed to this config's name; temperature is a request-level field
+        curl http://localhost:8080/v1/chat/completions -H "Content-Type: application/json" -d '{
+            "model": "aie-gemma-finetuned", "temperature": 0.1,
+            "messages": [{"role": "user", "content": "How are you doing?"}]
+        }'
+files:  # uri uses /resolve/ (raw file download); /blob/ would return the Hub's HTML viewer page
+- filename: "downloads/llama_backend/AIE_Gemma2_2B_IT_Q4_K_M.gguf"
+  sha256: ""  # TODO: record the GGUF's SHA-256; left empty in this patch
+  uri: "https://huggingface.co/Phabby/AIE-Gemma-2-2B-IT/resolve/main/AIE_Gemma2_2B_IT_Q4_K_M.gguf"
-- 
GitLab