11version : ' 2'
2- image_name : minimal-viable- llama-stack-configuration
2+ image_name : redhat-ai-dev- llama-stack
33
44apis :
5- - agents
6- - datasetio
7- - eval
8- - inference
9- - post_training
10- - safety
11- - scoring
12- - telemetry
13- - tool_runtime
14- - vector_io
5+ - agents
6+ - datasetio
7+ - eval
8+ - inference
9+ - post_training
10+ - safety
11+ - scoring
12+ - telemetry
13+ - tool_runtime
14+ - vector_io
1515benchmarks : []
1616container_image :
1717datasets : []
18- external_providers_dir : " /app-root/config/providers.d"
18+ external_providers_dir : ' /app-root/config/providers.d'
1919inference_store :
2020 db_path : .llama/distributions/ollama/inference_store.db
2121 type : sqlite
@@ -25,47 +25,47 @@ metadata_store:
2525 namespace :
2626 type : sqlite
2727models :
28- - model_id : sentence-transformers/all-mpnet-base-v2
29- metadata :
30- embedding_dimension : 768
31- model_type : embedding
32- provider_id : sentence-transformers
33- provider_model_id : " /app-root/embeddings_model"
28+ - model_id : sentence-transformers/all-mpnet-base-v2
29+ metadata :
30+ embedding_dimension : 768
31+ model_type : embedding
32+ provider_id : sentence-transformers
33+ provider_model_id : ' /app-root/embeddings_model'
3434providers :
3535 agents :
36- - config :
37- persistence_store :
38- db_path : .llama/distributions/ollama/agents_store.db
39- namespace :
40- type : sqlite
41- responses_store :
42- db_path : .llama/distributions/ollama/responses_store.db
43- type : sqlite
44- provider_id : meta-reference
45- provider_type : inline::meta-reference
36+ - config :
37+ persistence_store :
38+ db_path : .llama/distributions/ollama/agents_store.db
39+ namespace :
40+ type : sqlite
41+ responses_store :
42+ db_path : .llama/distributions/ollama/responses_store.db
43+ type : sqlite
44+ provider_id : meta-reference
45+ provider_type : inline::meta-reference
4646 datasetio :
47- - config :
48- kvstore :
49- db_path : .llama/distributions/ollama/huggingface_datasetio.db
50- namespace :
51- type : sqlite
52- provider_id : huggingface
53- provider_type : remote::huggingface
54- - config :
55- kvstore :
56- db_path : .llama/distributions/ollama/localfs_datasetio.db
57- namespace :
58- type : sqlite
59- provider_id : localfs
60- provider_type : inline::localfs
47+ - config :
48+ kvstore :
49+ db_path : .llama/distributions/ollama/huggingface_datasetio.db
50+ namespace :
51+ type : sqlite
52+ provider_id : huggingface
53+ provider_type : remote::huggingface
54+ - config :
55+ kvstore :
56+ db_path : .llama/distributions/ollama/localfs_datasetio.db
57+ namespace :
58+ type : sqlite
59+ provider_id : localfs
60+ provider_type : inline::localfs
6161 eval :
62- - config :
63- kvstore :
64- db_path : .llama/distributions/ollama/meta_reference_eval.db
65- namespace :
66- type : sqlite
67- provider_id : meta-reference
68- provider_type : inline::meta-reference
62+ - config :
63+ kvstore :
64+ db_path : .llama/distributions/ollama/meta_reference_eval.db
65+ namespace :
66+ type : sqlite
67+ provider_id : meta-reference
68+ provider_type : inline::meta-reference
6969 inference :
7070 - provider_id : ${env.ENABLE_VLLM:+vllm}
7171 provider_type : remote::vllm
@@ -91,123 +91,123 @@ providers:
9191 provider_type : inline::sentence-transformers
9292 config : {}
9393 post_training :
94- - config :
95- checkpoint_format : huggingface
96- device : cpu
97- distributed_backend :
98- dpo_output_dir : " . "
99- provider_id : huggingface
100- provider_type : inline::huggingface
94+ - config :
95+ checkpoint_format : huggingface
96+ device : cpu
97+ distributed_backend :
98+ dpo_output_dir : ' . '
99+ provider_id : huggingface
100+ provider_type : inline::huggingface
101101 safety :
102- - config :
103- excluded_categories : []
104- provider_id : llama-guard
105- provider_type : inline::llama-guard
106- - provider_id : lightspeed_question_validity
107- provider_type : inline::lightspeed_question_validity
108- config :
109- model_id : ${env.VALIDATION_PROVIDER:=vllm}/${env.VALIDATION_MODEL_NAME}
110- model_prompt : |-
111- Instructions:
102+ - config :
103+ excluded_categories : []
104+ provider_id : llama-guard
105+ provider_type : inline::llama-guard
106+ - provider_id : lightspeed_question_validity
107+ provider_type : inline::lightspeed_question_validity
108+ config :
109+ model_id : ${env.VALIDATION_PROVIDER:=vllm}/${env.VALIDATION_MODEL_NAME}
110+ model_prompt : |-
111+ Instructions:
112112
113- You area question classification tool. You are an expert in the following categories:
114- - Backstage
115- - Red Hat Developer Hub (RHDH)
116- - Kubernetes
117- - Openshift
118- - CI/CD
119- - GitOps
120- - Pipelines
121- - Developer Portals
122- - Deployments
123- - Software Catalogs
124- - Software Templates
125- - Tech Docs
113+ You are a question classification tool. You are an expert in the following categories:
114+ - Backstage
115+ - Red Hat Developer Hub (RHDH)
116+ - Kubernetes
117+ - Openshift
118+ - CI/CD
119+ - GitOps
120+ - Pipelines
121+ - Developer Portals
122+ - Deployments
123+ - Software Catalogs
124+ - Software Templates
125+ - Tech Docs
126126
127- Your job is to determine if a user's question is related to the categories you are an expert in. If the question is related to those categories, \
128- or any features that may be related to those categories, you will answer with ${allowed}.
127+ Your job is to determine if a user's question is related to the categories you are an expert in. If the question is related to those categories, \
128+ or any features that may be related to those categories, you will answer with ${allowed}.
129129
130- If a question is not related to your expert categories, answer with ${rejected}.
130+ If a question is not related to your expert categories, answer with ${rejected}.
131131
132- You do not need to explain your answer.
132+ You do not need to explain your answer.
133133
134- Below are some example questions:
135- Example Question:
136- Why is the sky blue?
137- Example Response:
138- ${rejected}
134+ Below are some example questions:
135+ Example Question:
136+ Why is the sky blue?
137+ Example Response:
138+ ${rejected}
139139
140- Example Question:
141- Can you help configure my cluster to automatically scale?
142- Example Response:
143- ${allowed}
140+ Example Question:
141+ Can you help configure my cluster to automatically scale?
142+ Example Response:
143+ ${allowed}
144144
145- Example Question:
146- How do I create import an existing software template in Backstage?
147- Example Response:
148- ${allowed}
145+ Example Question:
146+ How do I import an existing software template in Backstage?
147+ Example Response:
148+ ${allowed}
149149
150- Example Question:
151- How do I accomplish a task in RHDH?
152- Example Response:
153- ${allowed}
150+ Example Question:
151+ How do I accomplish a task in RHDH?
152+ Example Response:
153+ ${allowed}
154154
155- Example Question:
156- How do I explore a component in RHDH catalog?
157- Example Response:
158- ${allowed}
155+ Example Question:
156+ How do I explore a component in RHDH catalog?
157+ Example Response:
158+ ${allowed}
159159
160- Example Question:
161- How can I integrate GitOps into my pipeline?
162- Example Response:
163- ${allowed}
160+ Example Question:
161+ How can I integrate GitOps into my pipeline?
162+ Example Response:
163+ ${allowed}
164164
165- Question:
166- ${message}
167- Response:
168- invalid_question_response : |-
169- Hi, I'm the Red Hat Developer Hub Lightspeed assistant, I can help you with questions about Red Hat Developer Hub or Backstage.
170- Please ensure your question is about these topics, and feel free to ask again!
165+ Question:
166+ ${message}
167+ Response:
168+ invalid_question_response : |-
169+ Hi, I'm the Red Hat Developer Hub Lightspeed assistant. I can help you with questions about Red Hat Developer Hub or Backstage.
170+ Please ensure your question is about these topics, and feel free to ask again!
171171 scoring :
172- - config : {}
173- provider_id : basic
174- provider_type : inline::basic
175- - config : {}
176- provider_id : llm-as-judge
177- provider_type : inline::llm-as-judge
178- - config :
179- openai_api_key : ' ********'
180- provider_id : braintrust
181- provider_type : inline::braintrust
172+ - config : {}
173+ provider_id : basic
174+ provider_type : inline::basic
175+ - config : {}
176+ provider_id : llm-as-judge
177+ provider_type : inline::llm-as-judge
178+ - config :
179+ openai_api_key : ' ********'
180+ provider_id : braintrust
181+ provider_type : inline::braintrust
182182 telemetry :
183- - config :
184- service_name : ' lightspeed-stack-telemetry'
185- sinks : sqlite
186- sqlite_db_path : .llama/distributions/ollama/trace_store.db
187- provider_id : meta-reference
188- provider_type : inline::meta-reference
183+ - config :
184+ service_name : ' lightspeed-stack-telemetry'
185+ sinks : sqlite
186+ sqlite_db_path : .llama/distributions/ollama/trace_store.db
187+ provider_id : meta-reference
188+ provider_type : inline::meta-reference
189189 tool_runtime :
190- - provider_id : model-context-protocol
191- provider_type : remote::model-context-protocol
192- config : {}
193- - provider_id : rag-runtime
194- provider_type : inline::rag-runtime
195- config : {}
190+ - provider_id : model-context-protocol
191+ provider_type : remote::model-context-protocol
192+ config : {}
193+ - provider_id : rag-runtime
194+ provider_type : inline::rag-runtime
195+ config : {}
196196 vector_io :
197- - config :
198- kvstore :
199- db_path : .llama/distributions/ollama/faiss_store.db
200- namespace :
201- type : sqlite
202- provider_id : faiss
203- provider_type : inline::faiss
204- - provider_id : rhdh-docs
205- provider_type : inline::faiss
206- config :
207- kvstore :
208- type : sqlite
209- namespace :
210- db_path : /app-root/vector_db/rhdh_product_docs/1.8/faiss_store.db
197+ - config :
198+ kvstore :
199+ db_path : .llama/distributions/ollama/faiss_store.db
200+ namespace :
201+ type : sqlite
202+ provider_id : faiss
203+ provider_type : inline::faiss
204+ - provider_id : rhdh-docs
205+ provider_type : inline::faiss
206+ config :
207+ kvstore :
208+ type : sqlite
209+ namespace :
210+ db_path : /app-root/vector_db/rhdh_product_docs/1.8/faiss_store.db
211211scoring_fns : []
212212server :
213213 auth :
@@ -218,14 +218,14 @@ server:
218218 tls_certfile :
219219 tls_keyfile :
220220shields :
221- - shield_id : lightspeed_question_validity-shield
222- provider_id : lightspeed_question_validity
221+ - shield_id : lightspeed_question_validity-shield
222+ provider_id : lightspeed_question_validity
223223tool_groups :
224- - provider_id : rag-runtime
225- toolgroup_id : builtin::rag
226- description : " Only use for questions specifically about Red Hat Developer Hub (RHDH). Searches technical documentation for RHDH installation, discovery, configuration, release, upgrade, control access, integration, observability, and extending with plugins. Do not use for any other topic outside RHDH."
224+ - provider_id : rag-runtime
225+ toolgroup_id : builtin::rag
226+ description : ' Only use for questions specifically about Red Hat Developer Hub (RHDH). Searches technical documentation for RHDH installation, discovery, configuration, release, upgrade, control access, integration, observability, and extending with plugins. Do not use for any other topic outside RHDH.'
227227vector_dbs :
228- - embedding_dimension : 768
229- embedding_model : sentence-transformers/all-mpnet-base-v2
230- provider_id : rhdh-docs
231- vector_db_id : rhdh-product-docs-1_8
228+ - embedding_dimension : 768
229+ embedding_model : sentence-transformers/all-mpnet-base-v2
230+ provider_id : rhdh-docs
231+ vector_db_id : rhdh-product-docs-1_8
0 commit comments