Skip to content

Commit 0b3ce2f

Browse files
committed
feat: llama stack inference provider config file section
Signed-off-by: Haoyu Sun <[email protected]>
1 parent b779177 commit 0b3ce2f

File tree

4 files changed

+274
-0
lines changed

4 files changed

+274
-0
lines changed

internal/controller/constants.go

Lines changed: 24 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -112,10 +112,24 @@ const (
112112
LLMProviderHashStateCacheKey = "llmprovider-hash"
113113
// AzureOpenAIType is the name of the Azure OpenAI provider type
114114
AzureOpenAIType = "azure_openai"
115+
// OpenAIType is the name of the OpenAI provider type
116+
OpenAIType = "openai"
117+
// WatsonXType is the name of the Watson X provider type
118+
WatsonXType = "watsonx"
119+
// LlamaStackOpenAIType is the name of the OpenAI provider type for the llama stack
120+
LlamaStackOpenAIType = "remote::openai"
121+
// LlamaStackAzureOpenAIType is the name of the Azure OpenAI provider type for the llama stack
122+
LlamaStackAzureOpenAIType = "remote::azure_openai"
123+
// LlamaStackWatsonXType is the name of the Watson X provider type for the llama stack
124+
LlamaStackWatsonXType = "remote::watsonx"
115125
// AdditionalCAHashStateCacheKey is the key of the hash value of the additional CA certificates in the state cache
116126
AdditionalCAHashStateCacheKey = "additionalca-hash"
117127
// DeploymentInProgress message
118128
DeploymentInProgress = "In Progress"
129+
// LlamaStackConfigCmName is the name of the llama stack configuration configmap
130+
LlamaStackConfigCmName = "llama-stack-config"
131+
// LlamaStackConfigFilename is the name of the llama stack configuration file
132+
LlamaStackConfigFilename = "llama-stack-config.yaml"
119133

120134
/*** console UI plugin ***/
121135
// ConsoleUIConfigMapName is the name of the console UI nginx configmap
@@ -289,4 +303,14 @@ ssl_ca_file = '/etc/certs/cm-olspostgresca/service-ca.crt'
289303
MCPSECRETDATAPATH = "header"
290304
// LSCAppServerActivatorCmName is the name of the LSC app server activator configmap
291305
LSCAppServerActivatorCmName = "lsc-app-server-activator"
306+
307+
/*** llama stack configuration ***/
308+
// LlamaStackConfigVersion is the version of the llama stack configuration file, currently only version 2 is supported
309+
LlamaStackConfigVersion = "2"
310+
// OpenAIAPIKeyEnvVar is the environment variable for the OpenAI API key
311+
OpenAIAPIKeyEnvVar = "OPENAI_API_KEY"
312+
// AzureOpenAIAPIKeyEnvVar is the environment variable for the Azure OpenAI API key
313+
AzureOpenAIAPIKeyEnvVar = "AZURE_OPENAI_API_KEY"
314+
// WatsonXAPIKeyEnvVar is the environment variable for the Watson X API key
315+
WatsonXAPIKeyEnvVar = "WATSONX_API_KEY"
292316
)
Lines changed: 94 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,94 @@
1+
package controller
2+
3+
/*** Llama stack configuration ***/
4+
5+
// LlamaStackConfig is the root structure of the llama stack configuration file.
// It is marshalled to YAML via sigs.k8s.io/yaml (see generateLlamaStackConfigFile),
// which honours the json struct tags below.
type LlamaStackConfig struct {
	// Version is the version of the llama stack configuration file, currently only version 2 is supported
	// (see LlamaStackConfigVersion).
	Version string `json:"version"`
	// Providers is the list of providers for the llama stack, it contains providers for each of the llama stack components
	// such as inference, datasetio, etc.
	Providers ProviderList `json:"providers"`
}
13+
14+
// ProviderList is the list of providers for the llama stack, it contains providers for each of the llama stack components
// such as inference, datasetio, etc.
// Only the inference component is modelled so far; the remaining components
// are still to be added (see the todo inside the struct).
// here is an example of the providers section of the llama stack configuration file:
/*
providers:
  agents:
  - config:
      persistence_store:
        db_path: .llama/distributions/ollama/agents_store.db
        namespace: null
        type: sqlite
      responses_store:
        db_path: .llama/distributions/ollama/responses_store.db
        type: sqlite
    provider_id: meta-reference
    provider_type: inline::meta-reference
  datasetio:
  - config:
      kvstore:
        db_path: .llama/distributions/ollama/huggingface_datasetio.db
        namespace: null
        type: sqlite
    provider_id: huggingface
    provider_type: remote::huggingface
  - config:
      kvstore:
        db_path: .llama/distributions/ollama/localfs_datasetio.db
        namespace: null
        type: sqlite
    provider_id: localfs
    provider_type: inline::localfs
  inference:
  - provider_id: openai
    provider_type: remote::openai
    config:
      api_key: ${env.OPENAI_API_KEY}
*/
type ProviderList struct {
	// Inference holds the inference (LLM) provider entries, serialized under
	// the "inference" key of the providers section.
	Inference []InferenceProviderConfig `json:"inference"`

	// todo: add other providers here
}
56+
57+
// InferenceProviderConfig is one entry of the inference provider list in the
// llama stack configuration file.
type InferenceProviderConfig struct {
	// Provider ID is the unique identifier in the llama stack configuration
	ProviderID string `json:"provider_id"`
	// Provider Type is the type of the provider, this determines the underlying type of the Config field below
	ProviderType string `json:"provider_type"`
	// Config is the provider specific configuration, can be one of the following:
	// - InferenceProviderOpenAI
	// - InferenceProviderAzureOpenAI
	// - InferenceProviderWatsonX
	Config interface{} `json:"config"`
}
68+
69+
/*** Inference provider configuration ***/
70+
71+
// InferenceProviderOpenAI is the OpenAI inference provider configuration.
// https://llamastack.github.io/docs/providers/inference/remote_openai
type InferenceProviderOpenAI struct {
	// APIKey may be an environment variable reference, e.g. "${env.OPENAI_API_KEY}",
	// expanded by the llama stack at runtime.
	APIKey string `json:"api_key,omitempty"`
	// BaseURL is the OpenAI-compatible API endpoint.
	BaseURL string `json:"base_url,omitempty"`
}
77+
78+
// InferenceProviderAzureOpenAI is the Azure OpenAI inference provider configuration.
// https://llamastack.github.io/docs/providers/inference/remote_azure_openai
type InferenceProviderAzureOpenAI struct {
	// APIKey may be an environment variable reference, e.g. "${env.AZURE_OPENAI_API_KEY}".
	APIKey string `json:"api_key,omitempty"`
	// APIBase is the Azure OpenAI endpoint URL.
	APIBase string `json:"api_base,omitempty"`
	APIVersion string `json:"api_version,omitempty"`
	// APIType defaults to "azure" when left empty (per the llama stack provider).
	APIType string `json:"api_type,omitempty"`
}
86+
87+
// InferenceProviderWatsonX is the Watson X inference provider configuration.
// https://llamastack.github.io/docs/providers/inference/remote_watsonx
type InferenceProviderWatsonX struct {
	// APIKey may be an environment variable reference, e.g. "${env.WATSONX_API_KEY}".
	APIKey string `json:"api_key,omitempty"`
	URL string `json:"url,omitempty"`
	ProjectID string `json:"project_id,omitempty"`
	// Timeout for WatsonX requests — presumably seconds; TODO confirm against the
	// llama stack provider docs. Not set by the operator yet.
	Timeout int `json:"timeout,omitempty"`
}

internal/controller/lsc_app_server_assets.go

Lines changed: 52 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,10 +2,12 @@ package controller
22

33
import (
44
"context"
5+
"fmt"
56

67
appsv1 "k8s.io/api/apps/v1"
78
corev1 "k8s.io/api/core/v1"
89
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
10+
"sigs.k8s.io/yaml"
911

1012
olsv1alpha1 "github.com/openshift/lightspeed-operator/api/v1alpha1"
1113
)
@@ -62,3 +64,53 @@ func (r *OLSConfigReconciler) updateLSCDeployment(ctx context.Context, existingD
6264

6365
return nil
6466
}
67+
68+
// todo: implement other fields for the llama stack configuration map
69+
// generateLlamaStackConfigMap generates the llama stack configuration map for the LSC app server
70+
func (r *OLSConfigReconciler) generateLlamaStackConfigFile(ctx context.Context, cr *olsv1alpha1.OLSConfig) (string, error) {
71+
llamaStackConfig := &LlamaStackConfig{
72+
Version: LlamaStackConfigVersion,
73+
}
74+
75+
// inference providers
76+
for _, provider := range cr.Spec.LLMConfig.Providers {
77+
78+
providerConfig := InferenceProviderConfig{
79+
ProviderID: provider.Name,
80+
}
81+
switch provider.Type {
82+
case AzureOpenAIType:
83+
providerConfig.ProviderType = LlamaStackAzureOpenAIType
84+
providerConfig.Config = &InferenceProviderAzureOpenAI{
85+
// todo: add these environment variables to the podspec in generateLSCDeployment
86+
APIKey: fmt.Sprintf("${env.%s}", AzureOpenAIAPIKeyEnvVar),
87+
APIBase: provider.URL,
88+
APIVersion: provider.APIVersion,
89+
APIType: "", // default api type is "azure" for Azure OpenAI
90+
}
91+
// warning: AzureDeploymentName is not supported by Llama stack yet
92+
case OpenAIType:
93+
providerConfig.ProviderType = LlamaStackOpenAIType
94+
providerConfig.Config = &InferenceProviderOpenAI{
95+
// todo: add these environment variables to the podspec in generateLSCDeployment
96+
APIKey: fmt.Sprintf("${env.%s}", OpenAIAPIKeyEnvVar),
97+
BaseURL: provider.URL,
98+
}
99+
case WatsonXType:
100+
providerConfig.ProviderType = LlamaStackWatsonXType
101+
providerConfig.Config = &InferenceProviderWatsonX{
102+
// todo: add these environment variables to the podspec in generateLSCDeployment
103+
APIKey: fmt.Sprintf("${env.%s}", WatsonXAPIKeyEnvVar),
104+
URL: provider.URL,
105+
ProjectID: provider.WatsonProjectID,
106+
}
107+
}
108+
llamaStackConfig.Providers.Inference = append(llamaStackConfig.Providers.Inference, providerConfig)
109+
}
110+
111+
llamaStackConfigBytes, err := yaml.Marshal(llamaStackConfig)
112+
if err != nil {
113+
return "", fmt.Errorf("failed to generate llama stack configuration file %w", err)
114+
}
115+
return string(llamaStackConfigBytes), nil
116+
}

internal/controller/lsc_app_server_assets_test.go

Lines changed: 104 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -75,4 +75,108 @@ var _ = Describe("LSC App server assets", Label("LSCBackend"), Ordered, func() {
7575
})
7676
})
7777

78+
	// Verifies that generateLlamaStackConfigFile renders the expected YAML
	// (sigs.k8s.io/yaml: 2-space indent, alphabetically sorted keys) for each
	// supported inference provider type.
	Context("Llama stack config file generation", func() {
		// addAzureOpenAIProvider appends an Azure OpenAI provider spec to the CR.
		addAzureOpenAIProvider := func(cr *olsv1alpha1.OLSConfig) *olsv1alpha1.OLSConfig {
			cr.Spec.LLMConfig.Providers = append(cr.Spec.LLMConfig.Providers, olsv1alpha1.ProviderSpec{
				Name:       "testProviderAzureOpenAI",
				URL:        testURL,
				Type:       "azure_openai",
				APIVersion: "testAzureVersion",
			})
			return cr
		}

		// addOpenAIProvider appends an OpenAI provider spec to the CR.
		addOpenAIProvider := func(cr *olsv1alpha1.OLSConfig) *olsv1alpha1.OLSConfig {
			cr.Spec.LLMConfig.Providers = append(cr.Spec.LLMConfig.Providers, olsv1alpha1.ProviderSpec{
				Name: "testProviderOpenAI",
				URL:  testURL,
				Type: "openai",
			})
			return cr
		}

		// addWatsonXProvider appends a Watson X provider spec to the CR.
		addWatsonXProvider := func(cr *olsv1alpha1.OLSConfig) *olsv1alpha1.OLSConfig {
			cr.Spec.LLMConfig.Providers = append(cr.Spec.LLMConfig.Providers, olsv1alpha1.ProviderSpec{
				Name:            "testProviderWatsonX",
				URL:             testURL,
				Type:            "watsonx",
				WatsonProjectID: "testProjectID",
			})
			return cr
		}

		// Fresh reconciler and empty CR for every spec so providers added by
		// one test do not leak into the next.
		BeforeEach(func() {
			ctx = context.Background()
			rOptions = &OLSConfigReconcilerOptions{
				OpenShiftMajor:          "123",
				OpenshiftMinor:          "456",
				LightspeedServiceImage:  "lightspeed-service:latest",
				OpenShiftMCPServerImage: "openshift-mcp-server:latest",
				Namespace:               OLSNamespaceDefault,
			}
			r = &OLSConfigReconciler{
				Options:    *rOptions,
				logger:     logf.Log.WithName("olsconfig.reconciler"),
				Client:     k8sClient,
				Scheme:     k8sClient.Scheme(),
				stateCache: make(map[string]string),
			}
			cr = getEmptyOLSConfigCR()
		})

		Describe("Inference Provider", func() {
			It("should generate a valid llama stack config file for OpenAI provider", func() {
				cr = addOpenAIProvider(cr)
				llamaStackConfigFile, err := r.generateLlamaStackConfigFile(ctx, cr)
				Expect(err).NotTo(HaveOccurred())
				ExpectedConfigFile := `providers:
  inference:
  - config:
      api_key: ${env.OPENAI_API_KEY}
      base_url: https://testURL
    provider_id: testProviderOpenAI
    provider_type: remote::openai
version: "2"
`
				Expect(llamaStackConfigFile).To(Equal(ExpectedConfigFile))
			})

			It("should generate a valid llama stack config file for Azure OpenAI provider", func() {
				cr = addAzureOpenAIProvider(cr)
				llamaStackConfigFile, err := r.generateLlamaStackConfigFile(ctx, cr)
				Expect(err).NotTo(HaveOccurred())
				Expect(llamaStackConfigFile).NotTo(BeEmpty())
				// api_type is omitted because it is left empty (omitempty).
				ExpectedConfigFile := `providers:
  inference:
  - config:
      api_base: https://testURL
      api_key: ${env.AZURE_OPENAI_API_KEY}
      api_version: testAzureVersion
    provider_id: testProviderAzureOpenAI
    provider_type: remote::azure_openai
version: "2"
`
				Expect(llamaStackConfigFile).To(Equal(ExpectedConfigFile))
			})

			It("should generate a valid llama stack config file for Watson X provider", func() {
				cr = addWatsonXProvider(cr)
				llamaStackConfigFile, err := r.generateLlamaStackConfigFile(ctx, cr)
				Expect(err).NotTo(HaveOccurred())
				ExpectedConfigFile := `providers:
  inference:
  - config:
      api_key: ${env.WATSONX_API_KEY}
      project_id: testProjectID
      url: https://testURL
    provider_id: testProviderWatsonX
    provider_type: remote::watsonx
version: "2"
`
				Expect(llamaStackConfigFile).To(Equal(ExpectedConfigFile))
			})
		})

		// TODO: Add more test cases once the implementation is complete
	})
78182
})

0 commit comments

Comments
 (0)