* This recipe uses langchain.js and langgraph.js to create an AI application that does function calling
Signed-off-by: Lucas Holmquist <lholmqui@redhat.com>
https://github.com/containers/ai-lab-recipes/pull/806 updated the
version of chromadb used with the rag recipe when run with podman
ai lab.
Update the versions of Langchain and Chromadb clients to be compatible
Signed-off-by: Michael Dawson <mdawson@devrus.com>
pin the chromadb version when using quadlet and bootc to the
same one used when run with podman ai lab. Chromadb seems to
break compatibility regularly and the client must be compatible
with the chromadb version used.
Signed-off-by: Michael Dawson <mdawson@devrus.com>
We need to share container image storage between rootless users, so that
we don't need `sudo` and we don't duplicate the `instructlab` image.
This change follows the Red Hat solution to
[create additional image store for rootless
users](https://access.redhat.com/solutions/6206192).
The `/usr/lib/containers/storage` folder can be read by anyone and new
users will inherit a default configuration via `/etc/skel` that
configures the additional storage.
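As a hedged sketch, the shared-store setup might look like this (the paths follow the description above; the exact files laid down in the image may differ):
```bash
# Create the shared, world-readable image store and seed the default
# per-user configuration through /etc/skel.
mkdir -p /usr/lib/containers/storage
mkdir -p /etc/skel/.config/containers
cat > /etc/skel/.config/containers/storage.conf <<'EOF'
[storage]
driver = "overlay"

[storage.options]
additionalimagestores = [ "/usr/lib/containers/storage" ]
EOF
```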
The `ilab` wrapper is also modified to remove the impersonation code and
not use `sudo` anymore.
Follow-up on #766
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
We need to share container image storage between rootless users, so that
we don't need `sudo` and we don't duplicate the `instructlab` image.
This change follows the Red Hat solution to
[create additional image store for rootless users](https://access.redhat.com/solutions/6206192).
The `/usr/lib/containers/storage` folder can be read by anyone and new
users will inherit a default configuration via `/etc/skel` that
configures the additional storage.
The `ilab` wrapper is also modified to remove the impersonation code and
not use `sudo` anymore.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
Adds different steps for building required libraries, packages and dependencies for Intel Habanalabs
Signed-off-by: Enrique Belarte Luque <ebelarte@redhat.com>
Add SSL_CERT_FILE and SSL_CERT_DIR to the preserved environment variables and ensure they are passed to Podman. This change ensures that SSL certificates are correctly handled within the container environment.
Signed-off-by: Tyler Lisowski <lisowski@us.ibm.com>
When working with AI/ML recipes, it is frequent to pull versioned
software and data from Git repositories. This change adds the `git`
and `git-lfs` packages.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
Added workarounds for libdnf, the hl-smi binary and the ilab wrapper.
Also added a duplicated directory for common files to work with Konflux CI.
Signed-off-by: Enrique Belarte Luque <ebelarte@redhat.com>
This change updates the version of AMD ROCm to 6.2 in the amd-bootc
image for training. With this new version, the `rocm-smi` package is
replaced by the `amd-smi` package.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
The multi-stage build has too many stages. During the installation of
the `amdgpu-dkms` package, the modules are built and installed in
`/lib/modules/${KERNEL_VERSION}`. If the installation of the package is
done in the `driver-toolkit` image, the extra dependencies are very
limited. This change removes the `source` stage and installs the
`amdgpu-dkms` package on top of `driver-toolkit`.
The `amdgpu-dkms` package installs the modules in
`/lib/modules/${KERNEL_VERSION}/extra` and these are the only modules in
that folder. The `amdgpu-dkms-firmware` package is installed as a
dependency of `amdgpu-dkms` and it installs the firmware files in
`/lib/firmware/updates/amdgpu`. So, this change removes the in-tree
`amdgpu` modules and firmware, then copies the ones generated by DKMS in
the `builder` stage.
The change also moves the repository definitions to the `repos.d` folder
and adds the AMD public key to verify the signatures of the AMD RPMs.
The users call a wrapper script called `ilab` to hide the `instructlab`
container image and the command line options. This change copies the
file from `nvidia-bootc` and adjusts the logic. The main change is that
`/dev/kfd` and `/dev/dri` devices are passed to the container, instead
of `nvidia.com/gpu=all`. The `ilab` wrapper is copied in the `amd-bootc`
image.
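As a hedged illustration, the device handling boils down to something like this (the image name and trailing `ilab` invocation are illustrative, not the exact wrapper code):
```bash
# The nvidia-bootc wrapper exposes GPUs via CDI:
#   podman run ... --device nvidia.com/gpu=all ...
# The amd-bootc wrapper passes the KFD and DRI device nodes instead:
podman run --rm -it \
    --device /dev/kfd \
    --device /dev/dri \
    "${IMAGE_NAME}" ilab "$@"
```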
The Makefile is also modified to reflect these changes.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
The comment is no longer relevant since we changed the way we pass
environment variables to the container.
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
The use of a uid map leads to a new layer with all files chowned.
This takes several seconds due to the size of the instructlab
container (26GB). Normally this would be a one time cost where
the idmap layer is cached and reused across container creations;
however, since the container is stored on a read-only additional
image store, no caching is performed.
Address the problem by creating a derived empty container in
mutable container storage. This allows the 1k idmap layer to be
created in the same area, yet reuses the layers in the additional
image store.
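A minimal sketch of the idea, assuming `IMAGE_NAME` points at the image in the additional store (the derived tag is illustrative):
```bash
# Build an empty derived image in the user's writable container storage.
# The idmapped layer is then created and cached next to this tiny image,
# while the large instructlab layers stay in the read-only additional store.
printf 'FROM %s\n' "${IMAGE_NAME}" | podman build --tag "${IMAGE_NAME}-local" -f - .
```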
Signed-off-by: Jason T. Greene <jason.greene@redhat.com>
The `/dev/nvswitchctl` device is created by the NVIDIA Fabric Manager
service, so it cannot be a condition for the `nvidia-fabricmanager`
service.
Looking at the NVIDIA driver startup script for Kubernetes, the actual
check is the presence of `/proc/driver/nvidia-nvswitch/devices` and the
fact that it's not empty [1].
This change modifies the condition to
`ConditionDirectoryNotEmpty=/proc/driver/nvidia-nvswitch/devices`, which
verifies that a certain path exists and is a non-empty directory.
[1] https://gitlab.com/nvidia/container-images/driver/-/blob/main/rhel9/nvidia-driver?ref_type=heads#L262-269
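A hedged sketch of the change, assuming the shipped unit previously used a `ConditionPathExists` check (the unit file path is illustrative):
```bash
sed -i 's|ConditionPathExists=/dev/nvswitchctl|ConditionDirectoryNotEmpty=/proc/driver/nvidia-nvswitch/devices|' \
    /usr/lib/systemd/system/nvidia-fabricmanager.service
```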
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
The `nvidia-driver` package provides the firmware files for the given
driver version. This change removes the copy of the firmware from the
builder step and installs the `nvidia-driver` package instead. This also
allows better traceability of the files in the final image.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
Intel has released the version `1.17.0-495` of their Gaudi drivers. They
are available explicitly for RHEL 9.4 with a new `9.4` folder in the RPM
repository. This change updates the arguments to use the new version
from the new repository folder.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
When building the `driver-toolkit` image, it is cumbersome to find the kernel
version that matches the future `nvidia-bootc` and `intel-bootc` images.
However, the kernel version is stored as a label on the `rhel-bootc`
images, which are exposed as the `FROM` variable in the Makefile.
This change collects the kernel version using `skopeo inspect` and `jq`.
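As a hedged sketch, assuming the kernel version is exposed through the base image's `ostree.linux` label (the label name may differ), the lookup could look like:
```bash
FROM=quay.io/centos-bootc/centos-bootc:stream9
KERNEL_VERSION=$(skopeo inspect "docker://${FROM}" | jq -r '.Labels["ostree.linux"]')
echo "${KERNEL_VERSION}"   # e.g. 5.14.0-427.28.1.el9_4.x86_64
```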
The `DRIVER_TOOLKIT_BASE_IMAGE` variable is introduced in the Makefile
to dissociate it from the `FROM` variable that is used as the `nvidia-bootc`
and `intel-bootc` base image.
The user can now specify something like:
```shell
make nvidia-bootc \
FROM=quay.io/centos-bootc/centos-bootc:stream9 \
DRIVER_TOOLKIT_BASE_IMAGE=quay.io/centos/centos:stream9
```
Also, the `VERSION` variable in `/etc/os-release` is the full version, so
this change modifies the command to retrieve the `OS_VERSION_MAJOR`
value.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
During the build of the out-of-tree drivers, the base image will always
have the `kernel-core` package installed. And the `Makefile` doesn't
pass the `KERNEL_VERSION` argument to the build command. So, it's
simpler to rely on the `kernel-core` package info.
The commands to get the `KREL` and `KDIST` were not working with RHEL
9.4 kernel. The new set of commands has been tested with `ubi9/ubi:9.4`
and `centos/centos:stream9` based driver toolkit image and they return
the correct value. For example, the values returned for the following
kernels are:
* `5.14.0-427.28.1.el9_4` (`ubi9/ubi:9.4`):
  * `KVER`: `5.14.0`
  * `KREL`: `427.28.1`
  * `KDIST`: `.el9_4`
* `5.14.0-427.el9` (`centos/centos:stream9`):
  * `KVER`: `5.14.0`
  * `KREL`: `427`
  * `KDIST`: `.el9`
The `OS_VERSION_MAJOR` argument is also not passed by the `Makefile`,
but we can get it from the `/etc/os-release` file. I'm switching to
grep+sed, because I don't want to load all the other variables.
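A minimal sketch of the idea (not the exact Containerfile commands), deriving the values from the installed `kernel-core` package and `/etc/os-release`:
```bash
KERNEL_VERSION=$(rpm -q --qf '%{VERSION}-%{RELEASE}' kernel-core)  # e.g. 5.14.0-427.28.1.el9_4
KVER=$(rpm -q --qf '%{VERSION}' kernel-core)                       # 5.14.0
RELEASE=$(rpm -q --qf '%{RELEASE}' kernel-core)                    # 427.28.1.el9_4
KDIST=".${RELEASE##*.}"                                            # .el9_4
KREL="${RELEASE%.*}"                                               # 427.28.1
OS_VERSION_MAJOR=$(grep '^VERSION_ID=' /etc/os-release | sed -E 's/VERSION_ID="?([0-9]+).*/\1/')
```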
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
In the `nvidia-bootc` Containerfile, the condition on the existence of
`/dev/nvswitchctl` in the `nvidia-fabricmanager` unit file is not
persisted, because we don't use the `-i` option of `sed`, so the final
image still always tries to load the service. This change adds the `-i`
option to fix this.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
# Background
df8885777d
# Issue
The current error handling for multiple subuid ranges is broken due to
surprising behavior of `wc -l` which always returns `1` even when the
input is empty.
# Solution
More carefully count the number of lines in the
`CURRENT_USER_SUBUID_RANGE` variable
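A short illustration of the pitfall and a safer count (the variable name is the one used by the script):
```bash
printf '' | wc -l                            # prints 0
echo "${CURRENT_USER_SUBUID_RANGE}" | wc -l  # prints 1 even when the variable is empty,
                                             # because echo always appends a newline
# Safer: treat an empty variable as zero ranges
if [ -z "${CURRENT_USER_SUBUID_RANGE}" ]; then
    RANGE_COUNT=0
else
    RANGE_COUNT=$(printf '%s\n' "${CURRENT_USER_SUBUID_RANGE}" | wc -l)
fi
```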
# Additional changes
50fb00f26f had a small merge error; this
commit fixes that.
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
We have a file that's always a duplicate of another file. Until we can
get rid of this requirement, a pre-commit hook to take care of it would
be nice.
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
vLLM fails with empty env values. Adjust the env-passing model to
only set a value if it is defined.
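A hedged sketch of the pattern (the variable list and array name are illustrative):
```bash
ENV_OPTS=()
for var in VLLM_LOGGING_LEVEL NCCL_DEBUG; do
    # Only forward a variable when it is set and non-empty,
    # so vLLM never sees an empty value.
    value="${!var:-}"
    if [ -n "${value}" ]; then
        ENV_OPTS+=("--env" "${var}=${value}")
    fi
done
```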
Signed-off-by: Jason T. Greene <jason.greene@redhat.com>
# Background
See df8885777d
# Issue
This introduced a regression [1] where it's no longer possible to run the script
as root, as the subuid map ends up being empty and this causes an error:
```
Error: invalid empty host id at UID map: [1 1]
```
# Solution
Avoid UID mapping if we're already running as root.
# Motivation
We want to also be able to run the script as root, for example as part
of a systemd service.
[1] RHELAI-798
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
The default base image for the Driver Toolkit image is `centos:stream9`.
The original work for Driver Toolkit is in OpenShift and the base image
is `ubi9/ubi`. In both cases, the images don't have the `kernel`
package installed.
This change adds a test on the `KERNEL_VERSION` argument and exits if
it's not provided at build time. This also ensures that only the
relevant kernel is present when using `centos:stream9` or `ubi9/ubi`
as the base image. And this realigns a bit with the original Driver
Toolkit.
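A minimal sketch of such a build-time guard (the error message and follow-up install are illustrative):
```bash
if [ -z "${KERNEL_VERSION:-}" ]; then
    echo "Error: the KERNEL_VERSION build argument must be provided" >&2
    exit 1
fi
# Illustrative follow-up: install only the kernel packages matching that version
dnf -y install "kernel-core-${KERNEL_VERSION}" "kernel-devel-${KERNEL_VERSION}"
```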
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
- Set all indenting to 4 spaces (no tabs)
- Use POSIX style function definition in oneliner functions
- Remove unneeded exports on env variables
Signed-off-by: Javi Polo <jpolo@redhat.com>
Include ILAB_GLOBAL_CONFIG, VLLM_LOGGING_LEVEL, and NCCL_DEBUG as environment variables when starting the ilab container. Also add a shared memory size of 10G to enable vLLM execution. Resolves: https://github.com/containers/ai-lab-recipes/issues/721
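A hedged sketch of the resulting `podman run` flags (the image name and trailing `ilab` invocation are illustrative):
```bash
podman run --rm -it \
    --shm-size 10G \
    --env ILAB_GLOBAL_CONFIG \
    --env VLLM_LOGGING_LEVEL \
    --env NCCL_DEBUG \
    "${IMAGE_NAME}" ilab "$@"
```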
Signed-off-by: Tyler Lisowski <lisowski@us.ibm.com>
# Background
The ilab command is wrapped by an `ilab` script which launches ilab
inside a podman container.
# Issue
Since the ilab container image is pulled during the bootc image build
process using the root user, the image is not accessible to non-root
users.
# Solution
We run the container as sudo in order to be able to access the root
container storage. But for security reasons we map root UID 0 inside the
container to the current user's UID (and all the other subuids to the
user's /etc/subuid range) so that we're effectively running the
container as the current user.
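A hedged sketch of such an invocation (variable names are illustrative; the real script derives the range from `/etc/subuid`):
```bash
# Map container root to the invoking user and the remaining container UIDs
# to the user's subordinate UID range, while still using root's image storage.
sudo podman run --rm -it \
    --uidmap "0:${CURRENT_USER_UID}:1" \
    --uidmap "1:${SUBUID_START}:${SUBUID_LENGTH}" \
    --env "HOME=${HOME}" \
    "${IMAGE_NAME}" ilab "$@"
```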
# Additional changes
Changed `"--env" "HOME"` to `"--env" "HOME=$HOME"` to pass the HOME
environment variable from the current shell and not from the sudo
environment.
# Future work
In the future, we will run podman as the current user, once we figure out a
reasonable way for the current user to access the root user's container
storage.
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
# Background
We have an ilab wrapper script that users will use to launch the ilab
container.
Users may want to mount additional volumes into the container, as they
could possibly have e.g. large models stored in some external storage.
# Problem
Users cannot simply edit the script to add the mounts to the podman
command as it is read-only.
# Solution
Add support for an environment variable that users can set to specify
additional mounts to be added to the podman command. This will allow
users to specify additional mounts without having to modify the script.
# Implementation
The script will now check for the `ILAB_ADDITIONAL_MOUNTS` environment
variable. If it is set, the script will parse the variable as evaluated
bash code to get the mounts. The mounts will then be added to the podman
command.
Example `ILAB_ADDITIONAL_MOUNTS` usage:
```bash
ILAB_ADDITIONAL_MOUNTS="/host/path:/container/path /host/path2:/container/path2"
```
If your path contains spaces, you can use quotes:
```bash
ILAB_ADDITIONAL_MOUNTS="/host/path:/container/path '/host/path with spaces':/container/path"
```
The latter works because the script uses `eval` to parse the mounts.
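A minimal sketch of how the parsing might look inside the wrapper (array names are illustrative):
```bash
ADDITIONAL_MOUNT_OPTS=()
if [ -n "${ILAB_ADDITIONAL_MOUNTS:-}" ]; then
    # eval lets users quote host paths that contain spaces
    eval "additional_mounts=(${ILAB_ADDITIONAL_MOUNTS})"
    for mount in "${additional_mounts[@]}"; do
        ADDITIONAL_MOUNT_OPTS+=("-v" "${mount}")
    done
fi
```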
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
The wrapper had a mixed use of tabs/spaces, making it annoying to edit.
Formatted with shfmt to switch to spaces.
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
If the wrapper script is killed, the container will be left running.
Instead of just running the command, use `exec` to replace the
wrapper script with the command, so that the command will receive
the same signals as the wrapper script and the container will be
terminated as expected.
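In other words, the last line of the wrapper becomes something like this (options and image name are illustrative):
```bash
# Replace the wrapper process so podman receives SIGINT/SIGTERM directly
exec podman run --rm -it "${PODMAN_OPTS[@]}" "${IMAGE_NAME}" ilab "$@"
```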
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
The upgrade informer will run every couple of hours and will be triggered by a
systemd timer.
In order to start it on boot and run it once, both the service and the timer are enabled.
The auto-upgrade service is disabled in order to avoid unexpected reboots.
The service will run "bootc upgrade --check" and, in case a new version exists,
it will create a motd file with the upgrade info.
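A hedged sketch of what the timer-triggered informer might do (the output check and motd path are assumptions, not the actual implementation):
```bash
#!/bin/bash
# Check for a newer bootc image and leave a note for the next login if one exists.
if bootc upgrade --check | grep -q 'Update available'; then
    echo "A new RHEL AI version is available. Run 'bootc upgrade' to apply it." \
        > /etc/motd.d/upgrade-available
fi
```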
Signed-off-by: Igal Tsoiref <itsoiref@redhat.com>
Signed-off-by: Javi Polo <jpolo@redhat.com>
While skopeo may be part of the base image, there is no
guarantee, and as long as ilab requires it, we should
make sure it is installed.
Signed-off-by: Dan Walsh <dwalsh@redhat.com>
Background
RHEL AI ships with a script in `/usr/bin` called `ilab` which
makes running `ilab` commands feel native even though they're actually
running in a podman container
Issues
The abstraction becomes leaky once you start dealing with paths.
The user thinks in terms of local paths, but they are actually paths inside the pod,
and if the user performs any action with a path that's not mounted inside the pod,
files persisted to that path will not persist across ilab wrapper invocations.
Examples:
1. ilab config init outputs:
Generating `/root/.config/instructlab/config.yaml`...
Initialization completed successfully, you're ready to start using `ilab`. Enjoy!
But:
ls /root/.config/instructlab/config.yaml
ls: cannot access '/root/.config/instructlab/config.yaml': Permission denied
2. User provided paths e.g.:
ilab config init --model-path...
ilab model download --model-dir=...
The path may not be mounted to the host, so the data is written to the overlay fs and gone when the container dies
Solution
Mount the user's HOME directory and set HOME inside the container.
This seems to resolve the above issues as long as the user-provided paths
are nested under the user's HOME directory
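A minimal sketch of the fix (the image name and `ilab` invocation are illustrative):
```bash
# Mount the caller's home directory and keep HOME identical inside the container,
# so paths printed by ilab exist on the host and survive across invocations.
podman run --rm -it \
    -v "${HOME}:${HOME}" \
    --env "HOME=${HOME}" \
    "${IMAGE_NAME}" ilab "$@"
```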
Signed-off-by: Eran Cohen <eranco@redhat.com>
Ticket [RHELAI-442](https://issues.redhat.com/browse/RHELAI-442)
# Background
RHEL AI ships with a script in `/usr/local/bin` called `ilab` which
makes running `ilab` commands feel native even though they're actually
running in a podman container
# Issues
* The script is outdated / used several different container images for
different purposes, while it should be just using the single instructlab
image
* The volume mounts were incorrect, as instructlab now uses XDG paths
* Unnecessary directory creation for `HF_CACHE`
* Unnecessary GPU count logic
* Script has unnecessary fiddling of `ilab` parameters, essentially creating a
UX that deviates from the natural `ilab` CLI
# Solutions
* Changed script to use the single container image `IMAGE_NAME` (this
was already the case mostly, except for old references to `LVLM_NAME`
and `TRAIN_NAME` which no longer get replaced, leading to a broken `PODMAN_COMMAND_SERVE`).
Also adjusted the entrypoint to use the `ilab` executable in the pyenv
* Will now mount the host's `~/.config` and `~/.local` into the
container's corresponding directories, for `instructlab` to use
and for its config / data to persist across invocations
* Will now mount `~/.cache` into the container's corresponding `.cache`
directory, so that the information stored in the default `HF_CACHE` is
also persisted across invocations
* Removed unnecessary GPU count logic
* Removed all parameter parsing / fiddling
# Other changes
Added secret/fake "shell" `ilab` subcommand which opens a shell in the
wrapper's container, useful for troubleshooting issues with the wrapper
itself
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
it matches much better.
Changing the way we set the image_version_id label; in order for it to work in
Konflux we should use LABEL in the Containerfile.
Signed-off-by: Igal Tsoiref <itsoiref@redhat.com>
Of note, there was already a use of a "VENDOR" word to describe the
accelerator or provider (amd, intel, nvidia, etc.). I renamed that
in order to make room for this new use of VENDOR.
Signed-off-by: Ralph Bean <rbean@redhat.com>
Set the GitHub hash as the image version by default.
Add RHEL_AI_VERSION into /etc/os-release in order to use it in
Insights.
Signed-off-by: Igal Tsoiref <itsoiref@redhat.com>
The `nvidia-persistenced` and `nvidia-fabricmanager` services should be
started on machines with NVIDIA devices. Fabric Manager is only needed
on machines with an NVLink switch, so we patch it to start only if
/dev/nvswitchctl is present.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
Upstream, this image can be pulled unauthenticated, but in other
environments a user might want to include an image that exists in some
repository that requires authentication to pull.
The person building the image needs to provide
`--secret=id=instructlab-nvidia-pull/.dockerconfigjson,src=instructlab-nvidia-pull/.dockerconfigjson`
when building the image in order to make the secret available.
Signed-off-by: Ralph Bean <rbean@redhat.com>
For the InstructLab image, we use NVIDIA driver version `550.90.07` with
CUDA `12.4.1`, so this change updates the versions in the bootc image to
align the stack.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
- Fix model download container and targets
- Add prometheus model for eval
- Improve caching in instructlab container
- Add additional "models" targets for all permutations
- Introduce build chaining so that you can build everything in one step
- Small update to conform to $(MAKE) convention for submakes
Signed-off-by: Jason T. Greene <jason.greene@redhat.com>
The top level vendor targets (amd, intel, nvidia) fail with
"podman" build \
\
--file /root/ai-lab-recipes/training/model/../build/Containerfile.models \
--security-opt label=disable \
--tag "quay.io/ai-lab/-bootc-models:latest" \
-v /root/ai-lab-recipes/training/model/../build:/run/.input:ro
Error: tag quay.io/ai-lab/-bootc-models:latest: invalid reference format
make[1]: *** [Makefile:41: bootc-models] Error 125
make[1]: Leaving directory '/root/ai-lab-recipes/training/model'
make: *** [Makefile:70: bootc-models] Error 2
because VENDOR is not defined when the bootc-models target is called.
Modify the makefile to set VENDOR for each target.
Signed-off-by: Prarit Bhargava <prarit@redhat.com>
- Properly separate and order podman and bootc-image-builder arguments
- Move all the `selinux.tmp` workaround to the same layer, so bootc
install won't complain about missing files
Signed-off-by: Javi Polo <jpolo@redhat.com>
Any Gaudi update must be synchronized with all stakeholders. For now,
all packages, from kernel OOT drivers through firmware and SynapseAI to the
PyTorch stack, must have the same version. `habana-torch-plugin` version
`1.16.0.526` does not work with Kernel drivers `1.16.1-7`.
Signed-off-by: Christian Heimes <cheimes@redhat.com>
The NVIDIA bootc container is using multi-stage to avoid shipping build
dependencies in the final image, making it also smaller. This change
implements the same build strategy for the Intel bootc image.
The builder image is the same as for NVIDIA bootc. It is currently named
after NVIDIA, but should be renamed in a follow-up change. The benefit
is that a single builder image is maintained for all bootc images that
require out-of-tree drivers.
The number of build arguments is also reduced, since most of the
information is already present in the builder image. There is only one
kernel package per builder image and one image per architecture, so we
can retrieve the `KERNEL_VERSION` and `TARGET_ARCH` variables by
querying the RPM database. The OS information is retrieved by sourcing
the `/etc/os-release` file.
The extraction of the RPMs doesn't require storing the files, as
`rpm2cpio` supports streaming the file over HTTP(S). The number of
commands is smaller, and the downloads already happened for each build anyway,
since the download was not in a separate `RUN` statement.
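A hedged sketch of the streaming extraction (the URL and package name are purely illustrative):
```bash
# Per the above, rpm2cpio can read the RPM over HTTP(S), so the payload is
# extracted without ever keeping the .rpm file in a layer.
rpm2cpio "https://example.com/repo/habanalabs-firmware-1.17.0-495.el9_4.x86_64.rpm" | cpio -idm
```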
It is not necessary to copy the source of the drivers in `/usr/src`, since
we don't need to keep it in the final image. The Makefiles accept a
`KVERSION` variable to specify the version of the kernel and resolve its
path. The other benefit is to build as non-root.
The `.ko` files can then be copied to the final image with `COPY
--from=builder`. The change also ensures that the firmware files are
copied to the final image.
This change also adds support for `EXTRA_RPM_PACKAGES`.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
- Fix wrong script install (container lab used over wrapper [won't run on its own])
+ Restores elements that were unintentionally removed
- Fix quay tags
- Introduce "$ARCH-bootc-models" images in addition to bootc that include models
Signed-off-by: Jason T. Greene <jason.greene@redhat.com>
growfs is created by the Makefile and CI does not use it. Also, if I'm not mistaken, growfs is only used for disk image creation.
By changing this, the growfs file will only be created when the Makefile is running, so CI pipelines can build the Containerfile and growfs can still be used when needed.
Signed-off-by: Enrique Belarte Luque <ebelarte@redhat.com>
Konflux CI fails when building using bootc images as base throwing this error:
`Error: Cannot create repo temporary directory "/var/cache/dnf/baseos-044cae74d71fe9ea/libdnf.1jsyRp": Permission denied`
This temporary workaround is needed for build pipeline to work on Konflux CI until libdnf fix is merged to RHEL.
References:
https://issues.redhat.com/browse/RHEL-39796
https://github.com/rpm-software-management/libdnf/pull/1665
This should be removed once the permanent fix is merged.
Signed-off-by: Enrique Belarte Luque <ebelarte@redhat.com>
Many commands that are run for SDG and training can take a lot of time,
so there is a risk to have a network disconnection during the task. With
`tmux`, users have the ability to detach the jobs from their SSH session
and let the tasks run for a very long time.
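For example, a long job can be detached and resumed later:
```bash
# Start a named session for a long-running SDG or training job,
# then detach with Ctrl-b d and log out safely.
tmux new-session -s training
# Later, possibly from a new SSH connection, reattach to the job:
tmux attach -t training
```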
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
The `lspci` command is frequently used to inspect the hardware on a
server. Adding it to the OS image would help users to troubleshoot
deployment and configuration issues.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
Some users want to use buildah instead of podman to build
their container images.
Buildah does not support --squash-all, but after examining the podman
code, --squash-all ends up just being the equivalent of "--squash --layers=false"
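So a hedged equivalent would be (image name and tag are illustrative):
```bash
# podman
podman build --squash-all -t quay.io/example/nvidia-bootc:latest .
# buildah, using the equivalence described above
buildah build --squash --layers=false -t quay.io/example/nvidia-bootc:latest .
```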
Signed-off-by: Daniel J Walsh <dwalsh@redhat.com>
Fixed two instructions in the README.
1) The instruction to make the model pointed to detr-resnet-50 rather than the detr-resnet-101 that the instructions use.
2) The client container start had a /detection in the model address where it should not have.
Added signoff
Signed-off-by: Graeme Colman <gcolman@redhat.com>
And hence the Mixtral download fails
Downloading model failed with the following Hugging Face Hub error: 401 Client Error. (Request ID: Root=1-6637576e-28a8c5cb049f1dbb35d46d83;86121860-3ce0-419b-aed0-4fc79c440da7)
Cannot access gated repo for url https://huggingface.co/api/models/mistralai/Mixtral-8x7B-Instruct-v0.1/tree/main?recursive=True&expand=False.
Access to model mistralai/Mixtral-8x7B-Instruct-v0.1 is restricted. You must be authenticated to access it.
Signed-off-by: Rom Freiman <rfreiman@gmail.com>
## Testing frameworks
Our testing frameworks are a bit different from our standard workflows. In terms of compute, some of these jobs run either on AWS machines provisioned via terraform using secrets in the GitHub repository, or on customized GitHub-hosted action runners, as well as on the standard ubuntu-24.04 GitHub runners for jobs not requiring additional resources.
These workflows start by checking out the [terraform-test-environment-module](https://github.com/containers/terraform-test-environment-module) repo, as well as the code in `containers/ai-lab-recipes` at the `main` branch. Then they provision the terraform instance, install the correct ansible playbook requirements, and run a corresponding playbook. Additional actions may also be taken depending on the testing framework in question.
You can run the conversion image directly with podman in the terminal. You just need to provide it with the Hugging Face model name you want to download, the quantization level you want to use, and whether or not you want to keep the raw files after conversion. `HF_TOKEN` is optional; it is only required for private models.
st.session_state["Question"]="What is the Higgs Boson?"
if"Answers"notinst.session_state:
st.session_state["Answers"]={}
st.session_state["Answers"]["Right_Answer_1"]="The Higgs boson, sometimes called the Higgs particle, is an elementary particle in the Standard Model of particle physics produced by the quantum excitation of the Higgs field, one of the fields in particle physics theory"
st.session_state["Answers"]["Wrong_Answer_1"]="Alan Turing was the first person to conduct substantial research in the field that he called machine intelligence."
The llamacpp_python model server images are based on the [llama-cpp-python](https://github.com/abetlen/llama-cpp-python) project that provides python bindings for [llama.cpp](https://github.com/ggerganov/llama.cpp). This provides us with a python based and OpenAI API compatible model server that can run LLMs of various sizes locally across Linux, Windows or Mac.
This model server requires models to be converted from their original format, typically a set of `*.bin` or `*.safetensor` files into a single GGUF formatted file. Many models are available in GGUF format already on [huggingface.co](https://huggingface.co). You can also use the [model converter utility](../../convert_models/) available in this repo to convert models yourself.
## Image Options
We currently provide 3 options for the llamacpp_python model server:
* [Base](#base)
* [Cuda](#cuda)
* [Vulkan (experimental)](#vulkan-experimental)
### Base
The [base image](../llamacpp_python/base/Containerfile) is the standard image that works for both arm64 and amd64 environments. However, it does not include any hardware acceleration and will run with CPU only. If you use the base image, make sure that your container runtime has sufficient resources to run the desired model(s).
The [Cuda image](../llamacpp_python/cuda/Containerfile) includes all the extra drivers necessary to run our model server with Nvidia GPUs. This will significantly speed up the model's response time over CPU-only deployments.
To run the Cuda image with GPU acceleration, you need to install the correct [Cuda drivers](https://docs.nvidia.com/cuda/cuda-installation-guide-linux/index.html#driver-installation) for your system along with the [Nvidia Container Toolkit](https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/latest/install-guide.html#). Please use the links provided to find installation instructions for your system.
Once those are installed you can use the container toolkit CLI to discover your Nvidia device(s).
Finally, you will also need to add `--device nvidia.com/gpu=all` to your `podman run` command.
### Vulkan (experimental)
The [Vulkan](https://docs.vulkan.org/guide/latest/what_is_vulkan.html) image ([amd64](../llamacpp_python/vulkan/amd64/Containerfile)/[arm64](../llamacpp_python/vulkan/arm64/Containerfile)) is experimental, but can be used for gaining partial GPU access on an M-series Mac, significantly speeding up model response time over a CPU only deployment. This image requires that your podman machine provider is "applehv" and that you use krunkit instead of vfkit. Since these tools are not currently supported by podman desktop this image will remain "experimental".
There are many models to choose from these days, most of which can be found on [huggingface.co](https://huggingface.co). In order to use a model with the llamacpp_python model server, it must be in GGUF format. You can either download pre-converted GGUF models directly or convert them yourself with the [model converter utility](../../convert_models/) available in this repo.
A well-performing Apache-2.0 licensed model that we recommend using if you are just getting started is
`granite-7b-lab`. You can use the link below to quickly download a quantized (smaller) GGUF version of this model for use with the llamacpp_python model server.
Place all models in the [models](../../models/) directory.
You can use this snippet below to download the default model:
```bash
make download-model-granite
```
Or you can use the generic `download-models` target from the `/models` directory to download any model file from huggingface:
make MODEL_NAME=<model_name> MODEL_URL=<model_url> -f Makefile download-model
To deploy the LLM server you must specify a volume mount `-v` where your models are stored on the host machine and the `MODEL_PATH` for your model of choice. The model_server is most easily deployed by calling the make command: `make -f Makefile run`. Of course, as with all our make calls, you can pass any number of the following variables: `REGISTRY`, `IMAGE_NAME`, `MODEL_NAME`, `MODEL_PATH`, and `PORT`.
To enable dynamic loading and unloading of different models present on your machine, you can start the model service with a `CONFIG_PATH` instead of a `MODEL_PATH`.
Here is an example `models_config.json` with two model options.
Now run the container with the specified config file.
As stated above, by default the model service will use [`facebook/detr-resnet-101`](https://huggingface.co/facebook/detr-resnet-101). However you can use other compatible models. Simply pass the new `MODEL_NAME` and `MODEL_PATH` to the make command. Make sure the model is downloaded and exists in the [models directory](../../../models/):
```bash
# from path model_servers/object_detection_python from repo containers/ai-lab-recipes
make MODEL_NAME=facebook/detr-resnet-50 MODEL_PATH=/models/facebook/detr-resnet-101 run
```
## Build the AI Application
The following Podman command can be used to run your AI Application:
```bash
podman run -p 8501:8501 -e MODEL_ENDPOINT=http://10.88.0.1:8000 object_detection_client
```
This recipe demonstrates the ReAct (Reasoning and Acting) framework in action through a music exploration application. ReAct enables AI to think step-by-step about tasks, take appropriate actions, and provide reasoned responses. The application shows how ReAct can be used to create an intelligent music discovery assistant that combines reasoning with Spotify API interactions.
The application utilizes [`llama-cpp-python`](https://github.com/abetlen/llama-cpp-python) for the Model Service and integrates with Spotify's API for music data. The recipe uses [Langchain](https://python.langchain.com/docs/get_started/introduction) for the ReAct implementation and [Streamlit](https://streamlit.io/) for the UI layer.
## Spotify API Access
To use this application, you'll need Spotify API credentials:
- Create a Spotify Developer account
- Create an application in the Spotify Developer Dashboard
- Get your Client ID and Client Secret
These can be provided through environment variables or the application's UI.
## Try the ReAct Agent Application
The [Podman Desktop](https://podman-desktop.io) [AI Lab Extension](https://github.com/containers/podman-desktop-extension-ai-lab) includes this recipe among others. To try it out, open `Recipes Catalog` -> `ReAct Agent` and follow the instructions to start the application.
# Build the Application
The rest of this document will explain how to build and run the application from the terminal, and will
go into greater detail on how each container in the Pod above is built, run, and
what purpose it serves in the overall application. All the recipes use a central [Makefile](../../common/Makefile.common) that includes variables populated with default values to simplify getting started. Please review the [Makefile docs](../../common/README.md), to learn about further customizing your application.
This application requires a model, a model service and an AI inferencing application.
* [Quickstart](#quickstart)
* [Download a model](#download-a-model)
* [Build the Model Service](#build-the-model-service)
* [Deploy the Model Service](#deploy-the-model-service)
* [Build the AI Application](#build-the-ai-application)
* [Deploy the AI Application](#deploy-the-ai-application)
* [Interact with the AI Application](#interact-with-the-ai-application)
* [Embed the AI Application in a Bootable Container Image](#embed-the-ai-application-in-a-bootable-container-image)
## Quickstart
To run the application with pre-built images from `quay.io/ai-lab`, use `make quadlet`. This command
builds the application's metadata and generates Kubernetes YAML at `./build/chatbot.yaml` to spin up a Pod that can then be launched locally.
Try it with:
```
make quadlet
podman kube play build/chatbot.yaml
```
This will take a few minutes if the model and model-server container images need to be downloaded.
The Pod is named `chatbot`, so you may use [Podman](https://podman.io) to manage the Pod and its containers:
```
podman pod list
podman ps
```
Once the Pod and its containers are running, the application can be accessed at `http://localhost:8501`. However, if you started the app via the podman desktop UI, a random port will be assigned instead of `8501`. Please use the AI App Details `Open AI App` button to access it instead.
Please refer to the section below for more details about [interacting with the chatbot application](#interact-with-the-ai-application).
To stop and remove the Pod, run:
```
podman pod stop chatbot
podman pod rm chatbot
```
## Download a model
If you are just getting started, we recommend using [granite-7b-lab](https://huggingface.co/instructlab/granite-7b-lab). This is a
well-performing mid-sized model with an Apache-2.0 license. In order to use it with our Model Service we need it converted
and quantized into the [GGUF format](https://github.com/ggerganov/ggml/blob/master/docs/gguf.md). There are a number of
ways to get a GGUF version of granite-7b-lab, but the simplest is to download a pre-converted one from
The Model Service can be built from make commands from the [llamacpp_python directory](../../../model_servers/llamacpp_python/).
```bash
# from path model_servers/llamacpp_python from repo containers/ai-lab-recipes
make build
```
Check out the [Makefile](../../../model_servers/llamacpp_python/Makefile) to get more details on different options for how to build.
## Deploy the Model Service
The local Model Service relies on a volume mount to the localhost to access the model files. It also employs environment variables to dictate the model used and where it's served. You can start your local Model Service using the following `make` command from `model_servers/llamacpp_python` set with reasonable defaults:
```bash
# from path model_servers/llamacpp_python from repo containers/ai-lab-recipes
make run
```
## Build the AI Application
The AI Application can be built from the make command:
```bash
# Run this from the current directory (path recipes/natural_language_processing/chatbot from repo containers/ai-lab-recipes)
make build
```
## Deploy the AI Application
Make sure the Model Service is up and running before starting this container image. When starting the AI Application container image we need to direct it to the correct `MODEL_ENDPOINT`. This could be any appropriately hosted Model Service (running locally or in the cloud) using an OpenAI compatible API. In our case the Model Service is running inside the Podman machine so we need to provide it with the appropriate address `10.88.0.1`. To deploy the AI application use the following:
```bash
# Run this from the current directory (path recipes/natural_language_processing/chatbot from repo containers/ai-lab-recipes)
make run
```
## Interact with the AI Application
Everything should now be up and running with the chat application available at [`http://localhost:8501`](http://localhost:8501). By using this recipe and getting this starting point established, users should now have an easier time customizing and building their own LLM-enabled chatbot applications.
## Embed the AI Application in a Bootable Container Image
To build a bootable container image that includes this sample chatbot workload as a service that starts when a system is booted, run: `make -f Makefile bootc`. You can optionally override the default image / tag you want to give the make command by specifying it as follows: `make -f Makefile BOOTC_IMAGE=<your_bootc_image> bootc`.
Substituting the bootc/Containerfile FROM command is simple using the Makefile FROM option.
```bash
make FROM=registry.redhat.io/rhel9/rhel-bootc:9.4 bootc
```
Selecting the ARCH for the bootc/Containerfile is simple using the Makefile ARCH= variable.
```
make ARCH=x86_64 bootc
```
The magic happens when you have a bootc enabled system running. If you do, and you'd like to update the operating system to the OS you just built
with the chatbot application, it's as simple as ssh-ing into the bootc system and running:
```bash
bootc switch quay.io/ai-lab/chatbot-bootc:latest
```
Upon a reboot, you'll see that the chatbot service is running on the system. Check on the service with:
```bash
ssh user@bootc-system-ip
sudo systemctl status chatbot
```
### What are bootable containers?
What's a [bootable OCI container](https://containers.github.io/bootc/) and what's it got to do with AI?
That's a good question! We think it's a good idea to embed AI workloads (or any workload!) into bootable images at _build time_ rather than
at _runtime_. This extends the benefits, such as portability and predictability, that containerizing applications provides to the operating system.
Bootable OCI images bake exactly what you need to run your workloads into the operating system at build time by using your favorite containerization
tools. Might I suggest [podman](https://podman.io/)?
Once installed, a bootc enabled system can be updated by providing an updated bootable OCI image from any OCI
image registry with a single `bootc` command. This works especially well for fleets of devices that have fixed workloads - think
factories or appliances. Who doesn't want to add a little AI to their appliance, am I right?
Bootable images lend toward immutable operating systems, and the more immutable an operating system is, the less that can go wrong at runtime!
#### Creating bootable disk images
You can convert a bootc image to a bootable disk image using the `bootc-image-builder` container image.
This container image allows you to build and deploy [multiple disk image types](../../common/README_bootc_image_builder.md) from bootc container images.
Default image types can be set via the DISK_TYPE Makefile variable.
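A hedged example invocation (image names, mounts, and disk type are illustrative; check the bootc-image-builder documentation for the exact flags):
```bash
sudo podman run --rm -it --privileged \
    -v ./output:/output \
    -v /var/lib/containers/storage:/var/lib/containers/storage \
    quay.io/centos-bootc/bootc-image-builder:latest \
    --type qcow2 \
    quay.io/ai-lab/chatbot-bootc:latest
```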
Write-Error "Checksum validation is not supported for maven-mvnd. `nPlease disable validation by removing 'distributionSha256Sum' from your maven-wrapper.properties."
if ((Get-FileHash "$TMP_DOWNLOAD_DIR/$distributionUrlName" -Algorithm SHA256).Hash.ToLower() -ne $distributionSha256Sum) {
  Write-Error "Error: Failed to validate Maven distribution SHA-256, your Maven distribution might be compromised. If you updated your Maven version, you need to update the specified distributionSha256Sum property."