Skip to content

Commit

Permalink
chore: add gemma 1.1 model (#149)
Browse files: browse the repository at this point in the history
Signed-off-by: Sertac Ozercan <[email protected]>
  • Loading branch information
sozercan authored May 26, 2024
1 parent dfcf93e commit b84272c
Show file tree
Hide file tree
Showing 3 changed files with 41 additions and 0 deletions.
1 change: 1 addition & 0 deletions .github/workflows/patch-models.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -24,6 +24,7 @@ jobs:
- ghcr.io/sozercan/llama3:70b
- ghcr.io/sozercan/mixtral:8x7b
- ghcr.io/sozercan/phi3:3.8b
- ghcr.io/sozercan/gemma1.1:2b
steps:
- uses: jlumbroso/free-disk-space@54081f138730dfa15788a46383842cd2f914a1be # v1.3.1
with:
Expand Down
1 change: 1 addition & 0 deletions .github/workflows/update-models.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -24,6 +24,7 @@ jobs:
- llama-2-13b-chat
- llama-3-8b-instruct
- phi-3-3.8b
- gemma-1.1-2b-instruct
runs-on: ubuntu-latest
timeout-minutes: 360
steps:
Expand Down
39 changes: 39 additions & 0 deletions models/gemma-1.1-2b-instruct.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,39 @@
#syntax=ghcr.io/sozercan/aikit:latest
# Model image definition for gemma-1.1-2b-instruct (CUDA runtime).
# NOTE(review): keep the "#syntax=" directive as the very first line of the
# file; it is presumably only honoured there - confirm before moving it.
apiVersion: v1alpha1
debug: true
runtime: cuda
models:
  - name: gemma-1.1-2b-instruct
    # Q4_K_M GGUF file; its file name must match `parameters.model` in the
    # `config` block further down.
    source: https://huggingface.co/lmstudio-community/gemma-1.1-2b-it-GGUF/resolve/main/gemma-1.1-2b-it-Q4_K_M.gguf
    # Presumably the SHA-256 digest of the file at `source`; update both
    # together - TODO confirm.
    sha256: cc2118e1d780fa33582738d8c99223d62c8734b06ef65076c01618d484d081d4
    # Named prompt templates; the `config` block refers to them by name.
    promptTemplates:
      # Wraps one message in Gemma turn markers.
      # NOTE(review): the turn is always labelled "user", whatever the
      # message role is - confirm this is intended for multi-turn chats.
      - name: chatMsg
        template: |
          <start_of_turn>user
          {{if .Content }}{{ .Content }}{{ end }}<end_of_turn>
      # Emits the assembled input, then opens the model's turn.
      - name: chat
        template: |
          {{ .Input }}
          <start_of_turn>model
      # Plain completion: the input is passed through unchanged.
      - name: completion
        template: |
          {{ .Input }}
# Model configuration, kept as one literal block of text. Do not add comments
# inside it: they would become part of the value. The stopwords keep their
# backslash-escaped quotes byte-for-byte; presumably the consumer of this text
# requires that escaping - confirm before changing it.
config: |
  - name: gemma-1.1-2b-instruct
    backend: llama
    parameters:
      model: gemma-1.1-2b-it-Q4_K_M.gguf
    context_size: 8192
    template:
      chat_message: chatMsg
      chat: chat
      completion: completion
    repeat_penalty: 1
    stopwords:
      - \"<start_of_turn>\"
      - \"<end_of_turn>\"
      - \"<eos>\"
    gpu_layers: 35
    f16: true
    batch: 512
    mmap: true

0 comments on commit b84272c

Please sign in to comment.