opendatahub-io
diff --git a/‎packages/gen-ai/bff/internal/api/aaa_vectorstores_handler_test.go‎
Lines changed: 2 additions & 2 deletions b/‎packages/gen-ai/bff/internal/api/aaa_vectorstores_handler_test.go‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎packages/gen-ai/bff/internal/api/external_vectorstores_handler_test.go‎
Lines changed: 2 additions & 2 deletions b/‎packages/gen-ai/bff/internal/api/external_vectorstores_handler_test.go‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎packages/gen-ai/bff/internal/api/lsd_handler_test.go‎
Lines changed: 161 additions & 0 deletions b/‎packages/gen-ai/bff/internal/api/lsd_handler_test.go‎
Lines changed: 161 additions & 0 deletions
diff --git a/‎packages/gen-ai/bff/internal/api/lsd_install_handler.go‎
Lines changed: 1 addition & 1 deletion b/‎packages/gen-ai/bff/internal/api/lsd_install_handler.go‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎packages/gen-ai/bff/internal/integrations/kubernetes/client.go‎
Lines changed: 1 addition & 1 deletion b/‎packages/gen-ai/bff/internal/integrations/kubernetes/client.go‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎packages/gen-ai/bff/internal/integrations/kubernetes/k8smocks/base_testenv.go‎
Lines changed: 1 addition & 1 deletion b/‎packages/gen-ai/bff/internal/integrations/kubernetes/k8smocks/base_testenv.go‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎packages/gen-ai/bff/internal/integrations/kubernetes/k8smocks/testdata/vector_stores.yaml‎
Lines changed: 18 additions & 0 deletions b/‎packages/gen-ai/bff/internal/integrations/kubernetes/k8smocks/testdata/vector_stores.yaml‎
Lines changed: 18 additions & 0 deletions
diff --git a/‎packages/gen-ai/bff/internal/integrations/kubernetes/k8smocks/token_k8s_client_mock.go‎
Lines changed: 8 additions & 2 deletions b/‎packages/gen-ai/bff/internal/integrations/kubernetes/k8smocks/token_k8s_client_mock.go‎
Lines changed: 8 additions & 2 deletions
diff --git a/‎packages/gen-ai/bff/internal/integrations/kubernetes/llamastack_config.go‎
Lines changed: 35 additions & 30 deletions b/‎packages/gen-ai/bff/internal/integrations/kubernetes/llamastack_config.go‎
Lines changed: 35 additions & 30 deletions
@@ -71,7 +71,7 @@ var _ = Describe("VectorStoresAAHandler", func() {
 		err = json.Unmarshal(body, &response)
 		require.NoError(t, err)
 
-		assert.Len(t, response.Data, 3, "Should return 3 vector stores from the ConfigMap")
+		assert.Len(t, response.Data, 4, "Should return 4 vector stores from the ConfigMap")
 
 		for _, store := range response.Data {
 			assert.NotEmpty(t, store.VectorStoreID, "Store should have a vector_store_id")
@@ -108,7 +108,7 @@ var _ = Describe("VectorStoresAAHandler", func() {
 		err = json.Unmarshal(body, &response)
 		require.NoError(t, err)
 
-		assert.Len(t, response.Data, 3, "mock-test-namespace-1 should have the same 3 vector stores from its ConfigMap")
+		assert.Len(t, response.Data, 4, "mock-test-namespace-1 should have the same 4 vector stores from its ConfigMap")
 	})
 
 	It("should not include ConfigMap metadata in the response", func() {
 
@@ -72,8 +72,8 @@ var _ = Describe("ExternalVectorStoresListHandler", func() {
 		err = json.Unmarshal(body, &response)
 		require.NoError(t, err)
 
-		assert.Equal(t, 3, response.Data.TotalCount, "Should return 3 vector stores")
-		assert.Equal(t, 3, len(response.Data.VectorStores))
+		assert.Equal(t, 4, response.Data.TotalCount, "Should return 4 vector stores")
+		assert.Equal(t, 4, len(response.Data.VectorStores))
 
 		for _, store := range response.Data.VectorStores {
 			assert.NotEmpty(t, store.VectorStoreID, "Store should have a vector_store_id")
 
@@ -671,6 +671,167 @@ var _ = Describe("LlamaStackDistributionInstallHandlerWithMaaSModels", func() {
 	})
 })
 
+var _ = Describe("LlamaStackDistributionInstallHandlerWithVectorStores", func() {
+	var app App
+
+	BeforeEach(func() {
+		k8sFactory, err := k8smocks.NewTokenClientFactory(testK8sClient, testCfg, slog.Default())
+		require.NoError(GinkgoT(), err)
+
+		app = App{
+			config: config.EnvConfig{
+				Port: 4000,
+			},
+			logger:                  slog.Default(),
+			kubernetesClientFactory: k8sFactory,
+			repositories:            repositories.NewRepositories(),
+		}
+	})
+
+	It("should install LSD successfully with empty vector_stores", func() {
+		t := GinkgoT()
+		namespace := fmt.Sprintf("vs-empty-test-%d", time.Now().UnixNano())
+		ctx := context.Background()
+
+		requestBody := map[string]interface{}{
+			"models": []map[string]interface{}{
+				{"model_name": "llama-2-7b-chat", "model_source_type": "maas"},
+			},
+			"vector_stores": []interface{}{},
+		}
+		jsonBody, err := json.Marshal(requestBody)
+		require.NoError(t, err)
+
+		req, err := http.NewRequest(http.MethodPost, "/gen-ai/api/v1/llamastack-distribution/install", bytes.NewReader(jsonBody))
+		require.NoError(t, err)
+		req.Header.Set("Content-Type", "application/json")
+
+		ctx = context.WithValue(ctx, constants.NamespaceQueryParameterKey, namespace)
+		ctx = context.WithValue(ctx, constants.RequestIdentityKey, &integrations.RequestIdentity{Token: "FAKE_BEARER_TOKEN"})
+		ctx = context.WithValue(ctx, constants.MaaSClientKey, maasmocks.NewMockMaaSClient())
+		req = req.WithContext(ctx)
+
+		rr := httptest.NewRecorder()
+		app.LlamaStackDistributionInstallHandler(rr, req, nil)
+
+		assert.Equal(t, http.StatusOK, rr.Code)
+		var response map[string]interface{}
+		err = json.Unmarshal(rr.Body.Bytes(), &response)
+		assert.NoError(t, err)
+		_, hasData := response["data"]
+		assert.True(t, hasData)
+	})
+
+	It("should install LSD with a valid vector store", func() {
+		t := GinkgoT()
+		// mock-test-namespace-1 has gen-ai-aa-vector-stores ConfigMap pre-seeded; the requested ID must exist in it.
+		namespace := "mock-test-namespace-1"
+		ctx := context.Background()
+		cleanupTestNamespace(ctx, namespace)
+
+		requestBody := map[string]interface{}{
+			"models": []map[string]interface{}{
+				{"model_name": "llama-2-7b-chat", "model_source_type": "maas"},
+			},
+			"vector_stores": []map[string]interface{}{
+				{"vector_store_id": "vs_4c4b74e3-30ac-4e46-9057-213154f83dba"},
+			},
+		}
+		jsonBody, err := json.Marshal(requestBody)
+		require.NoError(t, err)
+
+		req, err := http.NewRequest(http.MethodPost, "/gen-ai/api/v1/llamastack-distribution/install", bytes.NewReader(jsonBody))
+		require.NoError(t, err)
+		req.Header.Set("Content-Type", "application/json")
+
+		ctx = context.WithValue(ctx, constants.NamespaceQueryParameterKey, namespace)
+		ctx = context.WithValue(ctx, constants.RequestIdentityKey, &integrations.RequestIdentity{Token: "FAKE_BEARER_TOKEN"})
+		ctx = context.WithValue(ctx, constants.MaaSClientKey, maasmocks.NewMockMaaSClient())
+		req = req.WithContext(ctx)
+
+		rr := httptest.NewRecorder()
+		app.LlamaStackDistributionInstallHandler(rr, req, nil)
+
+		// Log the recorder's buffered body directly; unlike io.ReadAll on rr.Result().Body there is no error to discard.
+		t.Logf("Response: %s", rr.Body.String())
+		assert.Equal(t, http.StatusOK, rr.Code)
+	})
+
+	It("should return 400 when vector_store_id is not found in ConfigMap", func() {
+		t := GinkgoT()
+		namespace := "mock-test-namespace-1"
+		ctx := context.Background()
+		cleanupTestNamespace(ctx, namespace)
+
+		requestBody := map[string]interface{}{
+			"models": []map[string]interface{}{
+				{"model_name": "llama-2-7b-chat", "model_source_type": "maas"},
+			},
+			"vector_stores": []map[string]interface{}{
+				{"vector_store_id": "nonexistent-store"},
+			},
+		}
+		jsonBody, err := json.Marshal(requestBody)
+		require.NoError(t, err)
+
+		req, err := http.NewRequest(http.MethodPost, "/gen-ai/api/v1/llamastack-distribution/install", bytes.NewReader(jsonBody))
+		require.NoError(t, err)
+		req.Header.Set("Content-Type", "application/json")
+
+		ctx = context.WithValue(ctx, constants.NamespaceQueryParameterKey, namespace)
+		ctx = context.WithValue(ctx, constants.RequestIdentityKey, &integrations.RequestIdentity{Token: "FAKE_BEARER_TOKEN"})
+		ctx = context.WithValue(ctx, constants.MaaSClientKey, maasmocks.NewMockMaaSClient())
+		req = req.WithContext(ctx)
+
+		rr := httptest.NewRecorder()
+		app.LlamaStackDistributionInstallHandler(rr, req, nil)
+
+		assert.Equal(t, http.StatusBadRequest, rr.Code)
+		var response map[string]interface{}
+		err = json.Unmarshal(rr.Body.Bytes(), &response)
+		assert.NoError(t, err)
+		errorMap, _ := response["error"].(map[string]interface{})
+		assert.Contains(t, errorMap["message"], "nonexistent-store")
+	})
+
+	It("should return 400 when vector stores ConfigMap is absent from the namespace", func() {
+		t := GinkgoT()
+		// Use a fresh namespace that has no pre-seeded ConfigMap.
+		namespace := fmt.Sprintf("vs-no-configmap-%d", time.Now().UnixNano())
+		ctx := context.Background()
+
+		requestBody := map[string]interface{}{
+			"models": []map[string]interface{}{
+				{"model_name": "llama-2-7b-chat", "model_source_type": "maas"},
+			},
+			"vector_stores": []map[string]interface{}{
+				{"vector_store_id": "vs_4c4b74e3-30ac-4e46-9057-213154f83dba"},
+			},
+		}
+		jsonBody, err := json.Marshal(requestBody)
+		require.NoError(t, err)
+
+		req, err := http.NewRequest(http.MethodPost, "/gen-ai/api/v1/llamastack-distribution/install", bytes.NewReader(jsonBody))
+		require.NoError(t, err)
+		req.Header.Set("Content-Type", "application/json")
+
+		ctx = context.WithValue(ctx, constants.NamespaceQueryParameterKey, namespace)
+		ctx = context.WithValue(ctx, constants.RequestIdentityKey, &integrations.RequestIdentity{Token: "FAKE_BEARER_TOKEN"})
+		ctx = context.WithValue(ctx, constants.MaaSClientKey, maasmocks.NewMockMaaSClient())
+		req = req.WithContext(ctx)
+
+		rr := httptest.NewRecorder()
+		app.LlamaStackDistributionInstallHandler(rr, req, nil)
+
+		assert.Equal(t, http.StatusBadRequest, rr.Code)
+		var response map[string]interface{}
+		err = json.Unmarshal(rr.Body.Bytes(), &response)
+		assert.NoError(t, err)
+		errorMap, _ := response["error"].(map[string]interface{})
+		assert.Contains(t, errorMap["message"], "gen-ai-aa-vector-stores")
+	})
+})
+
 var _ = Describe("LlamaStackDistributionDeleteHandler", func() {
 	var app App
 
 
@@ -84,7 +84,7 @@ func (app *App) LlamaStackDistributionInstallHandler(w http.ResponseWriter, r *h
 
 	// Pass the InstallModel structs directly to the repository
 	// enableGuardrails - if true, safety providers with shields will be configured for all models
-	response, err := app.repositories.LlamaStackDistribution.InstallLlamaStackDistribution(client, ctx, identity, namespace, installRequest.Models, installRequest.EnableGuardrails, maasClient)
+	response, err := app.repositories.LlamaStackDistribution.InstallLlamaStackDistribution(client, ctx, identity, namespace, installRequest.Models, installRequest.EnableGuardrails, installRequest.VectorStores, maasClient)
 	if err != nil {
 		app.badRequestResponse(w, r, err)
 		return
 
@@ -33,7 +33,7 @@ type KubernetesClientInterface interface {
 	// LlamaStack Distribution
 	GetLlamaStackDistributions(ctx context.Context, identity *integrations.RequestIdentity, namespace string) (*lsdapi.LlamaStackDistributionList, error)
 	CanListLlamaStackDistributions(ctx context.Context, identity *integrations.RequestIdentity, namespace string) (bool, error)
-	InstallLlamaStackDistribution(ctx context.Context, identity *integrations.RequestIdentity, namespace string, models []models.InstallModel, enableGuardrails bool, maasClient maas.MaaSClientInterface) (*lsdapi.LlamaStackDistribution, error)
+	InstallLlamaStackDistribution(ctx context.Context, identity *integrations.RequestIdentity, namespace string, installModels []models.InstallModel, enableGuardrails bool, vectorStores []models.InstallVectorStore, maasClient maas.MaaSClientInterface) (*lsdapi.LlamaStackDistribution, error)
 	DeleteLlamaStackDistribution(ctx context.Context, identity *integrations.RequestIdentity, namespace string, name string) (*lsdapi.LlamaStackDistribution, error)
 	GetModelProviderInfo(ctx context.Context, identity *integrations.RequestIdentity, namespace string, modelID string) (*types.ModelProviderInfo, error)
 
 
@@ -458,7 +458,7 @@ registered_resources:
       provider_id: vllm-inference-1
       model_type: llm
   shields: []
-  vector_dbs: []
+  vector_stores: []
   datasets: []
   scoring_fns: []
   benchmarks: []
 
@@ -39,6 +39,16 @@ providers:
       config:
         uri: http://milvus.vector.svc.cluster.local:19530
 
+    - provider_id: milvus-secure-provider
+      provider_type: remote::milvus
+      config:
+        uri: http://milvus-secure.vector.svc.cluster.local:19530
+        custom_gen_ai:
+          credentials:
+            secretRefs:
+              - name: milvus-credentials
+                key: token
+
 registered_resources:
   vector_stores:
     - provider_id: pgvector-provider
@@ -64,3 +74,11 @@ registered_resources:
       vector_store_name: "Code Vector Store (Milvus)"
       metadata:
         description: "Code embeddings for repository search"
+
+    - provider_id: milvus-secure-provider
+      vector_store_id: vs_c9e12f45-3b67-4d89-a012-3b4567890cde
+      embedding_model: ibm-granite/granite-embedding-125m-english
+      embedding_dimension: 768
+      vector_store_name: "Secure Knowledge Base (Milvus)"
+      metadata:
+        description: "Secure internal knowledge base with token auth"
@@ -384,7 +384,13 @@ func (m *TokenKubernetesClientMock) GetLlamaStackDistributions(ctx context.Conte
 	}, nil
 }
 
-func (m *TokenKubernetesClientMock) InstallLlamaStackDistribution(ctx context.Context, identity *integrations.RequestIdentity, namespace string, installModels []models.InstallModel, enableGuardrails bool, maasClient maas.MaaSClientInterface) (*lsdapi.LlamaStackDistribution, error) {
+func (m *TokenKubernetesClientMock) InstallLlamaStackDistribution(ctx context.Context, identity *integrations.RequestIdentity, namespace string, installModels []models.InstallModel, enableGuardrails bool, vectorStores []models.InstallVectorStore, maasClient maas.MaaSClientInterface) (*lsdapi.LlamaStackDistribution, error) {
+	if len(vectorStores) > 0 {
+		if _, err := m.LoadAndValidateVectorStores(ctx, identity, namespace, vectorStores); err != nil {
+			return nil, err
+		}
+	}
+
 	// Check if LSD already exists in the namespace
 	existingLSDList, err := m.GetLlamaStackDistributions(ctx, identity, namespace)
 	if err != nil {
@@ -604,7 +610,7 @@ registered_resources:
       provider_id: vllm-inference-1
       model_type: llm
 ` + shieldsSection + `
-  vector_dbs: []
+  vector_stores: []
   datasets: []
   scoring_fns: []
   benchmarks: []
 
@@ -62,13 +62,13 @@ type MetadataStore struct {
 }
 
 type RegisteredResources struct {
-	Models     []Model     `json:"models" yaml:"models"`
-	Shields    []Shield    `json:"shields" yaml:"shields"`
-	VectorDBs  []VectorDB  `json:"vector_dbs" yaml:"vector_dbs"`
-	Datasets   []Dataset   `json:"datasets" yaml:"datasets"`
-	ScoringFns []ScoringFn `json:"scoring_fns" yaml:"scoring_fns"`
-	Benchmarks []Benchmark `json:"benchmarks" yaml:"benchmarks"`
-	ToolGroups []ToolGroup `json:"tool_groups" yaml:"tool_groups"`
+	Models       []Model       `json:"models" yaml:"models"`
+	Shields      []Shield      `json:"shields" yaml:"shields"`
+	VectorStores []VectorStore `json:"vector_stores" yaml:"vector_stores"`
+	Datasets     []Dataset     `json:"datasets" yaml:"datasets"`
+	ScoringFns   []ScoringFn   `json:"scoring_fns" yaml:"scoring_fns"`
+	Benchmarks   []Benchmark   `json:"benchmarks" yaml:"benchmarks"`
+	ToolGroups   []ToolGroup   `json:"tool_groups" yaml:"tool_groups"`
 }
 
 type Storage struct {
@@ -229,12 +229,12 @@ func NewDefaultLlamaStackConfig() *LlamaStackConfig {
 		},
 		RegisteredResources: RegisteredResources{
 			// Ensure these serialize as `[]` (not `null`) when no values exist.
-			Models:     []Model{},
-			Shields:    []Shield{},
-			VectorDBs:  []VectorDB{},
-			Datasets:   []Dataset{},
-			ScoringFns: []ScoringFn{},
-			Benchmarks: []Benchmark{},
+			Models:       []Model{},
+			Shields:      []Shield{},
+			VectorStores: []VectorStore{},
+			Datasets:     []Dataset{},
+			ScoringFns:   []ScoringFn{},
+			Benchmarks:   []Benchmark{},
 			ToolGroups: []ToolGroup{
 				{
 					ToolGroupID: "builtin::rag",
@@ -351,7 +351,7 @@ func NewEmbeddingModel(modelID, providerID, providerModelID string, embeddingDim
 		ModelID:         modelID,
 		ProviderID:      providerID,
 		ProviderModelID: providerModelID,
-		ModelType:       "embedding",
+		ModelType:       string(models.ModelTypeEmbedding),
 		Metadata: map[string]interface{}{
 			"embedding_dimension": embeddingDimension,
 		},
@@ -363,7 +363,7 @@ func NewLLMModel(modelID, providerID string, displayName string) Model {
 	return Model{
 		ModelID:    modelID,
 		ProviderID: providerID,
-		ModelType:  "llm",
+		ModelType:  string(models.ModelTypeLLM),
 		Metadata: map[string]interface{}{
 			"display_name": displayName,
 		},
@@ -545,6 +545,11 @@ func (c *LlamaStackConfig) RegisterShield(shield Shield) {
 	c.RegisteredResources.Shields = append(c.RegisteredResources.Shields, shield)
 }
 
+// RegisterVectorStore appends store to the config's RegisteredResources.VectorStores list.
+func (c *LlamaStackConfig) RegisterVectorStore(store VectorStore) {
+	c.RegisteredResources.VectorStores = append(c.RegisteredResources.VectorStores, store)
+}
+
 // GetModelProviderInfo extracts model provider information for a given model ID
 // This is a two-step process:
 // 1. Find the model in the Models section and get its provider_id
@@ -631,13 +636,15 @@ type Shield struct {
 	Metadata   map[string]interface{} `json:"metadata,omitempty" yaml:"metadata,omitempty"`
 }
 
-// VectorDB represents a vector database configuration
-type VectorDB struct {
-	DBID       string                 `json:"db_id" yaml:"db_id"`
-	Name       string                 `json:"name" yaml:"name"`
-	ProviderID string                 `json:"provider_id" yaml:"provider_id"`
-	Config     map[string]interface{} `json:"config" yaml:"config"`
-	Metadata   map[string]interface{} `json:"metadata,omitempty" yaml:"metadata,omitempty"`
+// VectorStore is a registered_resources vector store entry; ID, embedding model and dimension are always serialized, the other fields only when set.
+type VectorStore struct {
+	VectorStoreID         string                 `json:"vector_store_id" yaml:"vector_store_id"`
+	EmbeddingModel        string                 `json:"embedding_model" yaml:"embedding_model"`
+	EmbeddingDimension    int                    `json:"embedding_dimension" yaml:"embedding_dimension"`
+	ProviderID            string                 `json:"provider_id,omitempty" yaml:"provider_id,omitempty"`
+	ProviderVectorStoreID string                 `json:"provider_vector_store_id,omitempty" yaml:"provider_vector_store_id,omitempty"`
+	VectorStoreName       string                 `json:"vector_store_name,omitempty" yaml:"vector_store_name,omitempty"`
+	Metadata              map[string]interface{} `json:"metadata,omitempty" yaml:"metadata,omitempty"`
 }
 
 // Dataset represents a dataset configuration
@@ -680,14 +687,12 @@ func NewShield(shieldID, shieldType, providerID string, config map[string]interf
 	}
 }
 
-// NewVectorDB creates a new VectorDB instance
-func NewVectorDB(dbID, name, providerID string, config map[string]interface{}) VectorDB {
-	return VectorDB{
-		DBID:       dbID,
-		Name:       name,
-		ProviderID: providerID,
-		Config:     config,
-		Metadata:   EmptyConfig(),
+// NewVectorStore returns a VectorStore with only its ID, embedding model, and embedding dimension set; every other field keeps its zero value.
+func NewVectorStore(vectorStoreID, embeddingModel string, embeddingDimension int) VectorStore {
+	return VectorStore{
+		VectorStoreID:      vectorStoreID,
+		EmbeddingModel:     embeddingModel,
+		EmbeddingDimension: embeddingDimension,
 	}
 }