nvidia-rag/variables.env at main · cloudian/nvidia-rag · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
# ==== For NVIDIA AI WORKBENCH Users Only! ====
# Set environment variables in the format KEY=VALUE, 1 per line
# This file will be sourced inside the project container when started.
# NOTE: If you change this file while the project is running, you must restart the project container for changes to take effect.

# ==== Flag for AI Workbench env ====
# Marks this environment as an NVIDIA AI Workbench project.
# NOTE(review): presumably read by the deployment scripts / compose files to
# switch on Workbench-specific behavior — confirm where it is consumed.
AI_WORKBENCH=true

# ==== Default docker volumes ====
# Both values are relative names (no leading path component).
# NOTE(review): presumably DATASET_ROOT is the directory holding documents to
# ingest and DOCKER_VOLUME_DIRECTORY is where vector DB data is persisted;
# confirm against the compose files which base directory they resolve against.
DATASET_ROOT=ingest
DOCKER_VOLUME_DIRECTORY=vectordb

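# ==== Set User for local NIM deployment ====
# NOTE(review): $(id -u) is shell command substitution. It only expands when
# this file is evaluated by a shell; a plain KEY=VALUE env-file parser would
# keep the literal text. Confirm how the file is loaded before uncommenting.
# USERID=$(id -u)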

# ==== Endpoints for using on-prem NIMs ====
# Active configuration: every endpoint below uses a bare host name.
# NOTE(review): the host names (nim-llm, nemoretriever-*, page-elements, ...)
# are presumably service names on the deployment's container network — confirm.

# LLM, embeddings and reranker: host:port with no URL scheme.
# NOTE(review): only the embeddings URL carries a "/v1" suffix; the LLM and
# ranking URLs are bare host:port. Confirm this matches what each client expects.
APP_LLM_SERVERURL=nim-llm:8000
APP_EMBEDDINGS_SERVERURL=nemoretriever-embedding-ms:8000/v1
APP_RANKING_SERVERURL=nemoretriever-ranking-ms:8000

# OCR: a gRPC endpoint (port 8001) and an HTTP endpoint (port 8000) are both
# defined. OCR_INFER_PROTOCOL is set to grpc, so presumably the gRPC endpoint
# is the one actually used — confirm.
OCR_GRPC_ENDPOINT=nemoretriever-ocr:8001
OCR_HTTP_ENDPOINT=http://nemoretriever-ocr:8000/v1/infer
OCR_INFER_PROTOCOL=grpc
OCR_MODEL_NAME=scene_text_ensemble

# YOLOX services (page elements, graphic elements, table structure): each has
# a gRPC endpoint on port 8001 with its protocol set to grpc. No HTTP endpoints
# are set for these in this block.
YOLOX_GRPC_ENDPOINT=page-elements:8001
YOLOX_INFER_PROTOCOL=grpc
YOLOX_GRAPHIC_ELEMENTS_GRPC_ENDPOINT=graphic-elements:8001
YOLOX_GRAPHIC_ELEMENTS_INFER_PROTOCOL=grpc
YOLOX_TABLE_STRUCTURE_GRPC_ENDPOINT=table-structure:8001
YOLOX_TABLE_STRUCTURE_INFER_PROTOCOL=grpc

# ==== Endpoints for using cloud NIMs ====
# APP_EMBEDDINGS_SERVERURL=""
# APP_LLM_SERVERURL=""
# APP_RANKING_SERVERURL=""
# OCR_HTTP_ENDPOINT=https://ai.api.nvidia.com/v1/cv/nvidia/nemoretriever-ocr
# OCR_INFER_PROTOCOL=http
# OCR_MODEL_NAME=scene_text_ensemble
# YOLOX_HTTP_ENDPOINT=https://ai.api.nvidia.com/v1/cv/nvidia/nemoretriever-page-elements-v3
# YOLOX_INFER_PROTOCOL=http
# YOLOX_GRAPHIC_ELEMENTS_HTTP_ENDPOINT=https://ai.api.nvidia.com/v1/cv/nvidia/nemoretriever-graphic-elements-v1
# YOLOX_GRAPHIC_ELEMENTS_INFER_PROTOCOL=http
# YOLOX_TABLE_STRUCTURE_HTTP_ENDPOINT=https://ai.api.nvidia.com/v1/cv/nvidia/nemoretriever-table-structure-v1
# YOLOX_TABLE_STRUCTURE_INFER_PROTOCOL=http


# Set GPU IDs for local deployment
# As configured here, the LLM is assigned GPU 1 and every other service GPU 0.
# NOTE(review): this presumably requires at least two visible GPUs; on a
# single-GPU host LLM_MS_GPU_ID would need to change — confirm.
# ==== LLM ====
LLM_MS_GPU_ID=1

# ==== Embeddings ====
EMBEDDING_MS_GPU_ID=0

# ==== Reranker ====
RANKING_MS_GPU_ID=0

# ==== Vector DB GPU ID ====
VECTORSTORE_GPU_DEVICE_ID=0

# ==== Ingestion NIMs GPU IDs ====
# One ID per ingestion service: page elements (YOLOX), graphic elements,
# table structure and OCR.
YOLOX_MS_GPU_ID=0
YOLOX_GRAPHICS_MS_GPU_ID=0
YOLOX_TABLE_MS_GPU_ID=0
OCR_MS_GPU_ID=0

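# ==== Enable Accuracy Profile (uncomment the settings below) ====
# Enable at most one of the Accuracy / Perf profiles; they set the same variables.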
# APP_NVINGEST_ENABLEPDFSPLITTER=False
# APP_NVINGEST_CHUNKSIZE=1024
# APP_NVINGEST_CHUNKOVERLAP=150
# ENABLE_RERANKER=True
# VECTOR_DB_TOPK=100

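# ==== Enable Perf Profile (uncomment the settings below) ====
# Enable at most one of the Accuracy / Perf profiles; they set the same variables.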
# APP_NVINGEST_ENABLEPDFSPLITTER=True
# APP_NVINGEST_CHUNKSIZE=512
# APP_NVINGEST_CHUNKOVERLAP=150
# ENABLE_RERANKER=False
# VECTOR_DB_TOPK=4
# APP_RETRIEVER_TOPK=10