-
Notifications
You must be signed in to change notification settings - Fork 235
/
Copy pathdeploy.yaml
85 lines (78 loc) · 1.92 KB
/
deploy.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
---
# Deployment manifest for a DKN compute node paired with an Ollama service.
# NOTE(review): the services/profiles/deployment layout and uakt pricing look
# like Akash SDL v2.0 — confirm against the target platform.
version: "2.0"
services:
  # DKN compute node: the publicly reachable workload.
  dkn:
    image: firstbatch/dkn-compute-node:v0.2.28
    expose:
      - port: 80
        as: 80
        to:
          - global: true
    env:
      # You need to provide a wallet private key here.
      # Do not commit a real key to version control.
      - DKN_WALLET_SECRET_KEY=
      # Comma-separated list of supported/enabled models. If you add more or
      # different models, check the resources in the compute profiles; they
      # might need a bump.
      - DKN_MODELS=llama3.1:latest
      # You can provide API keys to integrate with other services
      - OPENAI_API_KEY=
      - SERPER_API_KEY=
      - BROWSERLESS_TOKEN=
      - ANTHROPIC_API_KEY=
      # You probably don't want to touch these.
      # OLLAMA_HOST / OLLAMA_PORT point at the `ollama` service defined below.
      - OLLAMA_AUTO_PULL=true
      - OLLAMA_HOST=http://ollama
      - OLLAMA_PORT=11434
      - RUST_LOG=none,dkn_compute=debug,dkn_workflows=debug,dkn_p2p=debug,ollama_workflows=info
      - DKN_ADMIN_PUBLIC_KEY=0208ef5e65a9c656a6f92fb2c770d5d5e2ecffe02a6aade19207f75110be6ae658
  # Ollama backend: not exposed globally, reachable only from the dkn service.
  ollama:
    # Pinned by digest: this is the image `latest` pointed to on 2024-08-19,
    # update if needed.
    image: ollama/ollama@sha256:a45c1ae866f0ad115b5b2b5048cb80e02a8c49c36f60d49f449b0d6a3825cdbf
    expose:
      - port: 11434
        as: 11434
        to:
          - global: false
          - service: dkn
profiles:
  # Resource requests per service.
  compute:
    dkn:
      resources:
        cpu:
          units: 2
        memory:
          size: 2Gi
        storage:
          - size: 1Gi
    ollama:
      resources:
        cpu:
          units: 4
        memory:
          size: 10Gi
        storage:
          - size: 24Gi
        gpu:
          units: 1
          attributes:
            vendor:
              nvidia:
                # Or e.g. model: rtx3070 with ram: 8Gi.
                - model: rtx3090
                  ram: 24Gi
                  interface: pcie
  # Pricing per service for the `dcloud` placement.
  placement:
    dcloud:
      pricing:
        dkn:
          denom: uakt
          amount: 100000
        ollama:
          denom: uakt
          amount: 100000
# Maps each service onto the `dcloud` placement using the compute profile of
# the same name, one instance each.
deployment:
  dkn:
    dcloud:
      profile: dkn
      count: 1
  ollama:
    dcloud:
      profile: ollama
      count: 1