From 65619da8a0c9f263458af5a22d330d2ff1a20200 Mon Sep 17 00:00:00 2001 From: ishaansehgal99 Date: Wed, 8 Jan 2025 13:34:51 -0800 Subject: [PATCH 1/2] fix: Address misnamed paths --- README.md | 4 +- config/manager/kustomization.yaml | 2 +- docs/How-to-use-kaito-in-aks-arc.md | 2 +- .../reference-image-deployment.yaml | 2 +- docs/rag-todos.yaml | 53 +++++++++++++++++++ terraform/kaito.tf | 4 +- 6 files changed, 60 insertions(+), 7 deletions(-) create mode 100644 docs/rag-todos.yaml diff --git a/README.md b/README.md index 6b4ccdc63..072286679 100644 --- a/README.md +++ b/README.md @@ -1,8 +1,8 @@ # Kubernetes AI Toolchain Operator (Kaito) -![GitHub Release](https://img.shields.io/github/v/release/Azure/kaito) +![GitHub Release](https://img.shields.io/github/v/release/kaito-project/kaito) [![Go Report Card](https://goreportcard.com/badge/github.com/kaito-project/kaito)](https://goreportcard.com/report/github.com/kaito-project/kaito) -![GitHub go.mod Go version](https://img.shields.io/github/go-mod/go-version/Azure/kaito) +![GitHub go.mod Go version](https://img.shields.io/github/go-mod/go-version/kaito-project/kaito) [![codecov](https://codecov.io/gh/Azure/kaito/graph/badge.svg?token=XAQLLPB2AR)](https://codecov.io/gh/Azure/kaito) | ![notification](docs/img/bell.svg) What is NEW! | diff --git a/config/manager/kustomization.yaml b/config/manager/kustomization.yaml index 324aa4752..c49c54ec2 100644 --- a/config/manager/kustomization.yaml +++ b/config/manager/kustomization.yaml @@ -4,5 +4,5 @@ apiVersion: kustomize.config.k8s.io/v1beta1 kind: Kustomization images: - name: controller - newName: ghcr.io/azure//kaito + newName: ghcr.io/kaito-project/kaito/workspace newTag: latest diff --git a/docs/How-to-use-kaito-in-aks-arc.md b/docs/How-to-use-kaito-in-aks-arc.md index 2ac678e68..abc12267b 100644 --- a/docs/How-to-use-kaito-in-aks-arc.md +++ b/docs/How-to-use-kaito-in-aks-arc.md @@ -6,7 +6,7 @@ AKS Arc, or Azure Kubernetes Service (AKS) on Azure Arc, is a service that exten Follow the workflow below to enable this feature. ## Supported Models -Currently KAITO supports models such as Falcon, Phi2, Phi3, Llama2, Llama2Chat, Mistral. Please refer to KAITO’s [readme](https://github.com/Azure/kaito/blob/main/presets/README.md) file for the latest models. +Currently KAITO supports models such as Falcon, Phi2, Phi3, Llama2, Llama2Chat, Mistral. Please refer to KAITO’s [readme](https://github.com/kaito-project/kaito/blob/main/presets/README.md) file for the latest models. ## Prerequisite 1. Before you begin, please make sure you have the following details from your infrastructure administrator: diff --git a/docs/custom-model-integration/reference-image-deployment.yaml b/docs/custom-model-integration/reference-image-deployment.yaml index eabec20ab..c3bb75171 100644 --- a/docs/custom-model-integration/reference-image-deployment.yaml +++ b/docs/custom-model-integration/reference-image-deployment.yaml @@ -12,7 +12,7 @@ inference: spec: containers: - name: custom-llm-container - image: ghcr.io/azure/kaito/llm-reference-preset:latest + image: ghcr.io/kaito-project/kaito/llm-reference-preset:latest command: ["accelerate"] args: - "launch" diff --git a/docs/rag-todos.yaml b/docs/rag-todos.yaml new file mode 100644 index 000000000..48cfdfc6c --- /dev/null +++ b/docs/rag-todos.yaml @@ -0,0 +1,53 @@ +apiVersion: kaito.sh/v1alpha1 +kind: RAG_Workspace +metadata: + name: random + +resources: + - instanceType: "Standard_NC12s_v3" + labelSelector: + matchLabels: + apps: RAG +rag: + index: # Dataset input + # Optional + storage: # Need to handle following: azure, aws, (gcp?), postgresql, data via api + # Example #1 + AzureCosmosDB: URI + secret: # Auth (CSI Secret Store) + # Example #2 + AWSDocDB: URI + secret: # Auth (CSI Secret Store) + # Example #3 + # If blank use data via API and FAISS + # Example #4 + # Perssitent Volume - local files (SimpleDirectoryReader) + query: # FAISS (Take out of CRD and put in POST Request) + search_method: "l2" # Voronoi Search, product search + + models: + llm: + endpoint: "URL" # Service Endpoint + # -- OR -- + secret: # OpenAI Secret (Prorjected Volume) + + + embedding_model: + endpoint: "URL" # Service Endpoint - need to add presets for embedding + # -- OR -- + secret: # OpenAI Secret (Prorjected Volume) + # -- OR -- + hf_model: + - name: "BAAI/bge-small-en-v1.5" # model_id + token: # Optional + remote: false # can also run remotely + + + + + +Whole RAG workflow runs on one node +POST Request for handling Indexing Uses CRD information for Storage Info (Optional) + + + diff --git a/terraform/kaito.tf b/terraform/kaito.tf index 0468f5e64..3ef4cbbc0 100644 --- a/terraform/kaito.tf +++ b/terraform/kaito.tf @@ -26,7 +26,7 @@ resource "azurerm_federated_identity_credential" "kaito" { # Install the gpu-provisioner chart resource "helm_release" "gpu_provisioner" { name = "gpu-provisioner" - chart = "https://raw.githubusercontent.com/Azure/kaito/refs/heads/gh-pages/charts/kaito/gpu-provisioner-${var.kaito_gpu_provisioner_version}.tgz" + chart = "https://raw.githubusercontent.com/kaito-project/kaito/refs/heads/gh-pages/charts/kaito/gpu-provisioner-${var.kaito_gpu_provisioner_version}.tgz" namespace = "gpu-provisioner" create_namespace = true @@ -48,7 +48,7 @@ resource "helm_release" "gpu_provisioner" { # Install the kaito-workspace chart resource "helm_release" "kaito_workspace" { name = "kaito-workspace" - chart = "https://raw.githubusercontent.com/Azure/kaito/refs/heads/gh-pages/charts/kaito/workspace-${var.kaito_workspace_version}.tgz" + chart = "https://raw.githubusercontent.com/kaito-project/kaito/refs/heads/gh-pages/charts/kaito/workspace-${var.kaito_workspace_version}.tgz" namespace = "kaito-workspace" create_namespace = true } From f8429f645a246b41877a3200edaf1030eda19352 Mon Sep 17 00:00:00 2001 From: ishaansehgal99 Date: Wed, 8 Jan 2025 13:36:12 -0800 Subject: [PATCH 2/2] fix: Address misnamed paths --- docs/rag-todos.yaml | 53 --------------------------------------------- 1 file changed, 53 deletions(-) delete mode 100644 docs/rag-todos.yaml diff --git a/docs/rag-todos.yaml b/docs/rag-todos.yaml deleted file mode 100644 index 48cfdfc6c..000000000 --- a/docs/rag-todos.yaml +++ /dev/null @@ -1,53 +0,0 @@ -apiVersion: kaito.sh/v1alpha1 -kind: RAG_Workspace -metadata: - name: random - -resources: - - instanceType: "Standard_NC12s_v3" - labelSelector: - matchLabels: - apps: RAG -rag: - index: # Dataset input - # Optional - storage: # Need to handle following: azure, aws, (gcp?), postgresql, data via api - # Example #1 - AzureCosmosDB: URI - secret: # Auth (CSI Secret Store) - # Example #2 - AWSDocDB: URI - secret: # Auth (CSI Secret Store) - # Example #3 - # If blank use data via API and FAISS - # Example #4 - # Perssitent Volume - local files (SimpleDirectoryReader) - query: # FAISS (Take out of CRD and put in POST Request) - search_method: "l2" # Voronoi Search, product search - - models: - llm: - endpoint: "URL" # Service Endpoint - # -- OR -- - secret: # OpenAI Secret (Prorjected Volume) - - - embedding_model: - endpoint: "URL" # Service Endpoint - need to add presets for embedding - # -- OR -- - secret: # OpenAI Secret (Prorjected Volume) - # -- OR -- - hf_model: - - name: "BAAI/bge-small-en-v1.5" # model_id - token: # Optional - remote: false # can also run remotely - - - - - -Whole RAG workflow runs on one node -POST Request for handling Indexing Uses CRD information for Storage Info (Optional) - - -