-
Notifications
You must be signed in to change notification settings - Fork 13
/
.project-metadata.yaml
68 lines (64 loc) · 2.41 KB
/
.project-metadata.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
name: LLM Hands on Lab with CML
description: "Hands on Lab which demonstrates a number of concepts including web scraping, vector databases, model deployment, model usage, Langchain, application building, and instruction following/tuning."
author: "Cloudera"
date: "2023-12-20"
specification_version: 1.0
prototype_version: 1.0
# environment_variables:
# AWS_ACCESS_KEY_ID:
# description: "Access key ID for interacting with AWS Bedrock"
# prompt: "Enter your AWS Access Key ID (optional):"
# required: false
# AWS_SECRET_ACCESS_KEY:
# description: "Secret key for interacting with AWS Bedrock"
# prompt: "Enter your AWS Secret Access Key (optional):"
# required: false
# AWS_DEFAULT_REGION:
# default: "us-west-2"
# description: "AWS Region where Bedrock models are available"
# prompt: "Enter your AWS Region (default: us-west-2):"
# required: false
# PINECONE_API_KEY:
# description: "API Keys for Pinecone service"
# prompt: "Enter your Pinecone API Key (optional):"
# required: false
# PINECONE_REGION:
# default: "us-east-1"
# description: "Cloud Region within Pinecone service"
# prompt: "Enter your Pinecone Region (default: us-east-1):"
# required: false
# PINECONE_INDEX:
# description: "Index within Pinecone Environment"
# prompt: "Enter your Pinecone Index (optional):"
# required: false
runtimes:
- editor: JupyterLab
kernel: Python 3.10
edition: Nvidia GPU
tasks:
- type: run_session
name: Install Dependencies
script: 0_install_prerequisites/download_reqs_set_vars.py
short_summary: Install Dependencies
kernel: python3
cpu: 2
memory: 12
- type: run_session
name: Setup Chroma Server
script: 0_install_prerequisites/setup-chroma.py
short_summary: Setup Chroma Server Vector DB
long_summary: Resolve sqlite dependency with python version and control logging in Chroma server package
kernel: python3
cpu: 2
memory: 4
- type: create_job
name: Pull and Convert HTMLS to TXT
entity_label: htmls_to_txt
script: 2_populate_vector_db/html_to_text.py
arguments: None
short_summary: Create job to source htmls, download, and convert them to text.
long_summary: Create job to source htmls, download, and convert them to text. Update html_links.txt with the htmls you wish to download and convert.
cpu: 2
memory: 4
environment:
TASK_TYPE: CREATE/RUN_JOB