-
Notifications
You must be signed in to change notification settings - Fork 22
/
vectordb.yaml
125 lines (125 loc) · 3.07 KB
/
vectordb.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
# Stack identity: display name, description, and where its images come from.
name: VectorDB
description: A Tembo Postgres Stack configured to support vector data types, storage, and operations.
repository: "quay.io/tembo"
organization: tembo
# One image tag per key. Each key (14, 15, 16) matches the leading number in
# its tag; presumably the Postgres major version -- confirm against the
# consumer's schema. The entries must be nested under `images`; left at
# column 0 they become unrelated top-level keys and `images` parses as null.
images:
  14: "standard-cnpg:14-389a437"
  15: "standard-cnpg:15-389a437"
  16: "standard-cnpg:16-389a437"
# Quoted so the value can never be re-typed as a number if it is shortened.
stack_version: "0.1.0"
# Application services that accompany the stack. This file defines a single
# service, `embeddings`, listening on port 3000.
appServices:
  - image: quay.io/tembo/vector-serve:2a7cdb3
    name: embeddings
    env:
      # TMPDIR and XDG_CACHE_HOME both point inside /models, the path where
      # the hf-data-vol volume is mounted (see `storage` below).
      - name: TMPDIR
        value: /models
      # Kept as a quoted string: environment values are strings, not integers.
      - name: BATCH_SIZE
        value: "1000"
      - name: XDG_CACHE_HOME
        value: /models/.cache
    routing:
      # Expose port 3000 under /vectordb and apply the middleware defined in
      # the `middlewares` list below.
      - port: 3000
        ingressPath: /vectordb
        middlewares:
          - map-embeddings
    middlewares:
      # Custom YAML tag selecting the middleware kind; the mapping that follows
      # is its payload. The regex matches a leading "/vectordb" with an
      # optional trailing slash and substitutes "/v1/embeddings".
      - !replacePathRegex
        name: map-embeddings
        config:
          # Single-quoted so the backslashes are unambiguously literal.
          regex: '^\/vectordb\/?'
          replacement: /v1/embeddings
    resources:
      requests:
        cpu: 500m
        memory: 1500Mi
      # Memory limit equals the memory request; only CPU may burst (to 4000m).
      limits:
        cpu: 4000m
        memory: 1500Mi
    storage:
      volumeMounts:
        - mountPath: /models
          name: hf-data-vol
      volumes:
        # Ephemeral volume backed by a 2Gi ReadWriteOnce claim template; its
        # name must match the volumeMounts entry above.
        - ephemeral:
            volumeClaimTemplate:
              spec:
                accessModes:
                  - ReadWriteOnce
                resources:
                  requests:
                    storage: 2Gi
          name: hf-data-vol
    probes:
      # Both probes target the service port (3000) and wait 10 seconds before
      # the first check.
      readiness:
        path: /ready
        port: 3000
        initialDelaySeconds: 10
      liveness:
        path: /alive
        port: 3000
        initialDelaySeconds: 10
# Packages to install, each pinned to an exact version. Every `version` must
# be nested inside its list item; at column 0 it becomes a repeated top-level
# key instead of belonging to the package above it.
# Versions are quoted so a two-component value (e.g. 1.10) could never be
# re-typed as a float.
# NOTE(review): pg_cron is enabled under `extensions` and listed in
# shared_preload_libraries but has no entry here -- confirm it is provided
# some other way (base image or dependency resolution).
trunk_installs:
  - name: pgmq
    version: "1.1.1"
  - name: vectorize
    version: "0.15.0"
  - name: pgvector
    version: "0.7.0"
  - name: pg_stat_statements
    version: "1.10.0"
# Extensions and where they are turned on. Each entry carries a `locations`
# list; every location names a database, an enabled flag, and the extension
# version. All entries here target the `postgres` database and are enabled.
# Versions are quoted so they always load as strings.
extensions:
  # The pgvector package from trunk_installs carries the same version (0.7.0)
  # as this `vector` entry.
  - name: vector
    locations:
      - database: postgres
        enabled: true
        version: "0.7.0"
  - name: pg_cron
    locations:
      - database: postgres
        enabled: true
        version: "1.6.2"
  - name: pgmq
    locations:
      - database: postgres
        enabled: true
        version: "1.1.1"
  - name: vectorize
    locations:
      - database: postgres
        enabled: true
        version: "0.15.0"
  - name: pg_stat_statements
    locations:
      - database: postgres
        enabled: true
        version: "1.10.0"
postgres_config_engine: standard
# Postgres settings as name/value pairs. Each `value` must be nested in the
# same list item as its `name`; at column 0 the pairs come apart.
# Scalar types are intentionally left as written (numbers unquoted, 'on'
# quoted so it stays a string rather than a boolean).
postgres_config:
  # cron.host and vectorize.host both refer to the same path, /controller/run.
  - name: cron.host
    value: /controller/run
  - name: vectorize.host
    value: postgresql:///postgres?host=/controller/run
  - name: autovacuum_vacuum_cost_limit
    value: -1
  # The three autovacuum scale factors below share one value (0.05).
  - name: autovacuum_vacuum_scale_factor
    value: 0.05
  - name: autovacuum_vacuum_insert_scale_factor
    value: 0.05
  - name: autovacuum_analyze_scale_factor
    value: 0.05
  - name: checkpoint_timeout
    value: 10min
  - name: track_activity_query_size
    value: 2048
  - name: wal_compression
    value: 'on'
  - name: track_io_timing
    value: 'on'
  # https://www.postgresql.org/docs/15/runtime-config-logging.html
  - name: log_min_duration_statement
    value: 1000
  - name: pg_stat_statements.track
    value: all
  # Every library listed here also has an enabled entry under `extensions`.
  - name: shared_preload_libraries
    value: vectorize,pg_stat_statements,pg_cron
  # Port 3000 and the /v1/embeddings path match the `embeddings` app service's
  # routing port and middleware replacement target. ${NAMESPACE} is a
  # placeholder; presumably substituted by the consumer -- confirm.
  - name: vectorize.embedding_service_url
    value: http://${NAMESPACE}-embeddings.${NAMESPACE}.svc.cluster.local:3000/v1/embeddings