Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 1 addition & 2 deletions Makefile
Original file line number Diff line number Diff line change
Expand Up @@ -36,9 +36,8 @@ help: ## Show this help screen
awk 'BEGIN {FS = ":.*?## "}; {printf "\033[36m%-33s\033[0m %s\n", $$1, $$2}'
@echo ''

# TODO (Jdubrick): Replace reference to lightspeed-core/lightspeed-providers once bug is addressed.
update-question-validation:
curl -o ./config/providers.d/inline/safety/lightspeed_question_validity.yaml https://raw.githubusercontent.com/Jdubrick/lightspeed-providers/refs/heads/devai/resources/external_providers/inline/safety/lightspeed_question_validity.yaml
curl -o ./config/providers.d/inline/safety/lightspeed_question_validity.yaml https://raw.githubusercontent.com/lightspeed-core/lightspeed-providers/refs/tags/0.1.17/resources/external_providers/inline/safety/lightspeed_question_validity.yaml

$(VENV)/bin/activate: ./scripts/python-scripts/requirements.txt
python3 -m venv $(VENV)
Expand Down
6 changes: 5 additions & 1 deletion README.md
Original file line number Diff line number Diff line change
Expand Up @@ -127,7 +127,11 @@ Or if using the host network:
podman run -it -p 8321:8321 --env-file ./env/values.env --network host -v ./embeddings_model:/app-root/embeddings_model:Z -v ./vector_db/rhdh_product_docs:/app-root/vector_db/rhdh_product_docs:Z quay.io/redhat-ai-dev/llama-stack:latest
```

Latest Lightspeed Core developer image:
> [!WARNING]
> This repository currently runs Llama Stack v0.2.22, which is incompatible with Llama Stack >= 0.3.x. Because of this incompatibility, the most recent Lightspeed Core image this repository can consume is `quay.io/lightspeed-core/lightspeed-stack:dev-20251208-f20efb9`.
>

Latest Lightspeed Core Developer Image:
```
quay.io/lightspeed-core/lightspeed-stack:dev-latest
```
Expand Down
8 changes: 4 additions & 4 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -7,10 +7,10 @@ dependencies = [
"fastapi>=0.115.6",
"uvicorn>=0.34.3",
"kubernetes>=30.1.0",
"llama-stack==0.2.18",
"llama-stack-client==0.2.18",
"llama-stack==0.2.22",
"llama-stack-client==0.2.22",
"ollama>=0.2.0",
"openai==1.99.9",
"openai>=1.100.0",
"rich>=14.0.0",
"cachetools>=6.1.0",
"prometheus-client>=0.22.1",
Expand All @@ -34,7 +34,7 @@ dependencies = [
"greenlet",
"torch",
"sentence-transformers>=5.0.0",
"lightspeed_stack_providers @ git+https://github.com/Jdubrick/lightspeed-providers.git@devai",
"lightspeed_stack_providers==0.1.17",
"pydantic>=2.10.6",
"httpx",
]
Expand Down
81 changes: 13 additions & 68 deletions run.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -15,18 +15,13 @@
# limitations under the License.
version: '2'
image_name: redhat-ai-dev-llama-stack

apis:
- agents
- datasetio
- eval
- inference
- post_training
- safety
- scoring
- telemetry
- tool_runtime
- vector_io
- files
benchmarks: []
container_image:
datasets: []
Expand Down Expand Up @@ -58,29 +53,6 @@ providers:
type: sqlite
provider_id: meta-reference
provider_type: inline::meta-reference
datasetio:
- config:
kvstore:
db_path: .llama/distributions/ollama/huggingface_datasetio.db
namespace:
type: sqlite
provider_id: huggingface
provider_type: remote::huggingface
- config:
kvstore:
db_path: .llama/distributions/ollama/localfs_datasetio.db
namespace:
type: sqlite
provider_id: localfs
provider_type: inline::localfs
eval:
- config:
kvstore:
db_path: .llama/distributions/ollama/meta_reference_eval.db
namespace:
type: sqlite
provider_id: meta-reference
provider_type: inline::meta-reference
inference:
- provider_id: ${env.ENABLE_VLLM:+vllm}
provider_type: remote::vllm
Expand All @@ -105,19 +77,7 @@ providers:
- provider_id: sentence-transformers
provider_type: inline::sentence-transformers
config: {}
post_training:
- config:
checkpoint_format: huggingface
device: cpu
distributed_backend:
dpo_output_dir: '.'
provider_id: huggingface
provider_type: inline::huggingface
safety:
- config:
excluded_categories: []
provider_id: llama-guard
provider_type: inline::llama-guard
- provider_id: lightspeed_question_validity
provider_type: inline::lightspeed_question_validity
config:
Expand Down Expand Up @@ -183,24 +143,6 @@ providers:
invalid_question_response: |-
Hi, I'm the Red Hat Developer Hub Lightspeed assistant, I can help you with questions about Red Hat Developer Hub or Backstage.
Please ensure your question is about these topics, and feel free to ask again!
scoring:
- config: {}
provider_id: basic
provider_type: inline::basic
- config: {}
provider_id: llm-as-judge
provider_type: inline::llm-as-judge
- config:
openai_api_key: '********'
provider_id: braintrust
provider_type: inline::braintrust
telemetry:
- config:
service_name: 'lightspeed-stack-telemetry'
sinks: sqlite
sqlite_db_path: .llama/distributions/ollama/trace_store.db
provider_id: meta-reference
provider_type: inline::meta-reference
tool_runtime:
- provider_id: model-context-protocol
provider_type: remote::model-context-protocol
Expand All @@ -209,20 +151,21 @@ providers:
provider_type: inline::rag-runtime
config: {}
vector_io:
- config:
kvstore:
db_path: .llama/distributions/ollama/faiss_store.db
namespace:
type: sqlite
provider_id: faiss
provider_type: inline::faiss
- provider_id: rhdh-docs
- provider_id: rhdh-product-docs-1_8
provider_type: inline::faiss
config:
kvstore:
type: sqlite
namespace:
db_path: /app-root/vector_db/rhdh_product_docs/1.8/faiss_store.db
files:
- provider_id: localfs
provider_type: inline::localfs
config:
storage_dir: /tmp/llama-stack-files
metadata_store:
type: sqlite
db_path: files_metadata.db
scoring_fns: []
server:
auth:
Expand All @@ -242,5 +185,7 @@ tool_groups:
vector_dbs:
- embedding_dimension: 768
embedding_model: sentence-transformers/all-mpnet-base-v2
provider_id: rhdh-docs
provider_id: rhdh-product-docs-1_8
vector_db_id: rhdh-product-docs-1_8
provider_vector_db_id: rhdh-product-docs-1_8
vector_store_id: rhdh-product-docs-1_8
59 changes: 25 additions & 34 deletions uv.lock

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.