eacortes committed on
Commit
2807e98
·
1 Parent(s): 44df690

fix: reduce vector index resource

Browse files
Files changed (3) hide show
  1. Dockerfile +1 -2
  2. redis.conf +1 -1
  3. src/constants.py +2 -2
Dockerfile CHANGED
@@ -15,10 +15,9 @@ COPY redis.conf .
15
  ENV REDIS_HOST=localhost
16
  ENV REDIS_PORT=6379
17
 
 
18
  ENV TRANSFORMERS_CACHE=/tmp/.cache/huggingface/transformers
19
  ENV HF_HOME=/tmp/.cache/huggingface
20
  ENV SENTENCE_TRANSFORMERS_HOME=/tmp/.cache/sentence_transformers
21
 
22
- COPY ./src ./src
23
-
24
  CMD ["sh", "-c", "redis-server redis.conf & python3 src/app.py"]
 
15
  ENV REDIS_HOST=localhost
16
  ENV REDIS_PORT=6379
17
 
18
+ COPY ./src ./src
19
  ENV TRANSFORMERS_CACHE=/tmp/.cache/huggingface/transformers
20
  ENV HF_HOME=/tmp/.cache/huggingface
21
  ENV SENTENCE_TRANSFORMERS_HOME=/tmp/.cache/sentence_transformers
22
 
 
 
23
  CMD ["sh", "-c", "redis-server redis.conf & python3 src/app.py"]
redis.conf CHANGED
@@ -2,4 +2,4 @@ loadmodule /opt/redis-stack/lib/redisearch.so
2
 
3
  maxmemory 768mb
4
 
5
- dir /data
 
2
 
3
  maxmemory 768mb
4
 
5
+ dir /tmp
src/constants.py CHANGED
@@ -13,10 +13,10 @@ HNSW_PARAMETERS = {
13
  # Defines the initial capacity of the vector index. It helps in pre-allocating space for the index.
14
  "INITIAL_CAP": 440,
15
  # Max number of outgoing edges (connections) for each node in a graph layer.
16
- "M": 32,
17
  # Max number of connected neighbors to consider during graph building.
18
  # Higher values increase accuracy, but also increase index build time.
19
- "EF_CONSTRUCTION": 512,
20
  # Max top candidates during KNN search. Higher values increase accuracy, but also increase search latency.
21
  "EF_RUNTIME": 10,
22
  }
 
13
  # Defines the initial capacity of the vector index. It helps in pre-allocating space for the index.
14
  "INITIAL_CAP": 440,
15
  # Max number of outgoing edges (connections) for each node in a graph layer.
16
+ "M": 16,
17
  # Max number of connected neighbors to consider during graph building.
18
  # Higher values increase accuracy, but also increase index build time.
19
+ "EF_CONSTRUCTION": 256,
20
  # Max top candidates during KNN search. Higher values increase accuracy, but also increase search latency.
21
  "EF_RUNTIME": 10,
22
  }