-
Notifications
You must be signed in to change notification settings - Fork 7
/
Copy path.project-metadata.yaml
131 lines (118 loc) · 4.64 KB
/
.project-metadata.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
# Project identity and metadata-format versions.
name: DocGenius AI - Generative AI Chatbot
# Literal block scalar: the value keeps its single trailing newline.
description: |
  Generative AI Chatbot for your Documents powered by Cloudera
author: Suri Nuthalapati
# Written canonically (no leading zero) so every YAML loader types it the
# same way; `01.0` is not a valid number under the strict JSON schema.
specification_version: 1.0
prototype_version: 1.0
# Quoted so the value stays a string and is not converted to a date object.
date: "2024-04-25"
# Settings exposed for configuration. Each entry carries a default, a
# description and, for some, a `required` flag.
environment_variables:
  VECTOR_DB:
    default: "MILVUS"
    description: >-
      Enter 'MILVUS' or 'PINECONE' for your preferred Vector DB.
      Only 'MILVUS' or 'PINECONE' are valid options.
      Milvus does not require any additional setup.
      Pinecone will require you to create an account and generate an API key.
    required: true
  # Per their descriptions, the two PINECONE_* values matter only when
  # Pinecone is the chosen Vector DB, so neither is marked required.
  PINECONE_API_KEY:
    default: ""
    description: >-
      Only Required for Pinecone Vector DB: Enter your API Key for Pinecone
      here. (Shown in API Keys page)
  PINECONE_ENVIRONMENT:
    default: "gcp-starter"
    description: >-
      Only Required for Pinecone Vector DB: Enter your Pinecone environment
      here. (Shown in API Keys page)
  KB_VECTOR_INDEX:
    default: "retail_kb"
    description: >-
      If this is not set now, it will need to be configured for the
      application to function.
    required: true
  NEXT_PUBLIC_CHATBOT_API_DOMAIN:
    # NOTE(review): presumably the consumer substitutes $CDSW_DOMAIN; YAML
    # itself performs no variable expansion - confirm.
    default: "$CDSW_DOMAIN"
    description: >-
      Required for building UI application: Enter the domain for the Chatbot
      API. This is the same as the CDSW_DOMAIN environment variable.
    required: true
  PROJECT_GIT_BRANCH:
    default: "main"
    description: >-
      Enter the branch name for the git repo. The default is 'main' and can
      be changed to identify variations for organizations with multiple
      branches.
  MODEL_DETAILS:
    default: ""
    description: "json string with model details"
    required: true
  HF_TOKEN:
    default: ""
    # Folded scalar: the two lines are joined with a space, so the first
    # sentence needs its own terminating period.
    description: >-
      Blank for Ungated Models.
      Provide HuggingFace Token for Gated Models.
    # required: true
# Runtime selection: one entry naming the editor, kernel and edition.
runtimes:
- editor: "JupyterLab"
  # Quoted to make the string type explicit.
  kernel: "Python 3.10"
  edition: "Standard"
# Sequence of tasks; each entry's `type` names the action it performs.
tasks:
# Session task that runs the git-branch selection script.
- type: run_session
  name: "Select the Git Branch"
  script: "session/other/select_git_branch.py"
  kernel: "python3"
  cpu: 2
  memory: 8
  short_summary: "Select the Git Branch"
  long_summary: >-
    Select the Git Branch. The default is 'main' and can be changed to
    identify variations for organizations with multiple branches.
# Session task that runs the general dependency-installation script.
- type: run_session
  name: "Install Dependencies"
  script: "session/install-deps/install_general_deps.py"
  kernel: "python3"
  cpu: 2
  memory: 8
  short_summary: "Install Dependencies for your Project"
# Job definition for the Milvus ingestion script.
- type: create_job
  entity_label: milvus_ingestion
  name: Populate Milvus Vector DB with documents embeddings
  script: pipeline/load_data/milvus_ingest_kb.py
  # Plain `None` is read by YAML as the string "None", not as a null value.
  arguments: None
  cpu: 2
  memory: 8
  environment:
    TASK_TYPE: CREATE/RUN_JOB
  short_summary: >-
    Create job to populate Milvus Vector Database with document embeddings.
    (This is the default Vector DB and will run if "MILVUS" was left or set
    as the Vector DB.)
  long_summary: >-
    Create job to launch Milvus Vector Database locally and insert embeddings
    for documents. Embeddings are generated by the locally running embeddings
    model.
# Run step carrying the same entity_label as the create_job entry above.
- type: run_job
  entity_label: milvus_ingestion
  short_summary: Populate Milvus Vector DB with document embeddings
# Application task that starts the chatbot API from app/main.py.
- type: start_application
  # NOTE(review): "DocGenuis" looks like a typo for "DocGenius". It is left
  # unchanged in case anything looks this application up by name - confirm
  # before renaming.
  name: API for Chatbot - DocGenuis AI
  subdomain: docgenius-api
  static_subdomain: true
  script: app/main.py
  # Spelling corrected to match the product name used elsewhere in this file.
  short_summary: Start API for DocGenius AI Chatbot
  long_summary: >-
    Start and Publish API for DocGenius AI. Remember to enable unauthenticated
    app access for external access to the UI.
  cpu: 2
  memory: 8
  environment_variables:
    TASK_TYPE: START_APPLICATION
  # NOTE(review): placed at task level (not under environment_variables);
  # presumably this allows unauthenticated access to the app - confirm.
  bypass_authentication: true
# Job definition for the chat UI setup/build script.
- type: create_job
  entity_label: setup_chatui
  name: "Build Chatbot UI Code"
  script: "chat-ui/setup.py"
  # Plain `None` is read by YAML as the string "None", not as a null value.
  arguments: None
  cpu: 2
  memory: 8
  environment:
    TASK_TYPE: "CREATE/RUN_JOB"
  short_summary: "Setup Node, NPM, YARN Env Setup and Build Code"
  long_summary: "Setup Node, NPM, YARN Env Setup and Build Code"
# Run step carrying the same entity_label as the create_job entry above.
- type: run_job
  entity_label: setup_chatui
  short_summary: "Build Chatbot UI Code"
# Application task that starts the frontend UI from chat-ui/app.py.
- type: start_application
  name: Frontend UI - DocGenius AI
  subdomain: docgenius-ui
  static_subdomain: true
  script: chat-ui/app.py
  # Spelling corrected ("DocGenuis" -> "DocGenius") to match this task's name.
  short_summary: Start frontend UI for DocGenius AI Chatbot
  long_summary: >-
    This task will run Flask app to serve the Chatbot Frontend UI. Remember to
    enable unauthenticated app access for external access to the UI.
  cpu: 2
  memory: 8
  environment_variables:
    TASK_TYPE: START_APPLICATION
  # NOTE(review): placed at task level (not under environment_variables);
  # presumably this allows unauthenticated access to the app - confirm.
  bypass_authentication: true
# Final session task: runs the cmlapi configuration script.
- type: run_session
  name: "Configure some features and flags via cmlapi after deployment"
  script: "session/cmlapi/apply_fix_conf.py"
  kernel: "python3"
  cpu: 2
  memory: 8
  short_summary: "Configure some features and flags via cmlapi after deployment"