* This recipe uses langchain.js and langgraph.js to create an AI application that does function calling
Signed-off-by: Lucas Holmquist <lholmqui@redhat.com>
https://github.com/containers/ai-lab-recipes/pull/806 updated the
version of chromadb used with the rag recipe when run with podman
ai lab.
Update the versions of Langchain and Chromadb clients to be compatible
Signed-off-by: Michael Dawson <mdawson@devrus.com>
pin the chromadb version when using quadlet and bootc to the
same one used when run with podman ai lab. Chromadb seems to
break compatibility regularly and the client must be compatible
with the chromadb version used.
Signed-off-by: Michael Dawson <mdawson@devrus.com>
We need to share container image storage between rootless users, so that
we don't need `sudo` and we don't duplicate the `instructlab` image.
This change follows the Red Hat solution to
[create additional image store for rootless
users](https://access.redhat.com/solutions/6206192).
The `/usr/lib/containers/storage` folder can be read by anyone and new
users will inherit a default configuration via `/etc/skel` that
configures the additional storage.
The `ilab` wrapper is also modified to remove the impersonation code and
not use `sudo` anymore.
Follow-up on #766
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
We need to share container image storage between rootless users, so that
we don't need `sudo` and we don't duplicate the `instructlab` image.
This change follows the Red Hat solution to
[create additional image store for rootless users](https://access.redhat.com/solutions/6206192).
The `/usr/lib/containers/storage` folder can be read by anyone and new
users will inherit a default configuration via `/etc/skel` that
configures the additional storage.
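For illustration, a minimal sketch of the kind of per-user configuration this relies on (the file contents and keys here are an assumption, not the literal files shipped by this change):
```bash
# Hypothetical sketch: expose a read-only additional image store to rootless users.
mkdir -p /etc/skel/.config/containers
cat > /etc/skel/.config/containers/storage.conf <<'EOF'
[storage]
driver = "overlay"

[storage.options]
additionalimagestores = ["/usr/lib/containers/storage"]
EOF
```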
The `ilab` wrapper is also modified to remove the impersonation code and
not use `sudo` anymore.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
Adds different steps for building required libraries, packages and dependencies for Intel Habanalabs
Signed-off-by: Enrique Belarte Luque <ebelarte@redhat.com>
Add SSL_CERT_FILE and SSL_CERT_DIR to the preserved environment variables and ensure they are passed to Podman. This change ensures that SSL certificates are correctly handled within the container environment.
Signed-off-by: Tyler Lisowski <lisowski@us.ibm.com>
When working with AI/ML recipes, it is frequent to pull versioned
software and data from Git repositories. This change adds the `git`
and `git-lfs` packages.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
Added workarounds for libdnf, the hl-smi binary, and the ilab wrapper.
Also added a duplicated directory for common files to work with Konflux CI.
Signed-off-by: Enrique Belarte Luque <ebelarte@redhat.com>
This change updates the version of AMD ROCm to 6.2 in the amd-bootc
image for training. With this new version, the `rocm-smi` package is
replaced by the `amd-smi` package.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
The multi-stage build has too many stages. During the installation of
the `amdgpu-dkms` package, the modules are built and installed in
`/lib/modules/${KERNEL_VERSION}`. If the installation of the package is
done in the `driver-toolkit` image, the extra dependencies are very
limited. This change removes the `source` stage and installs the
`amdgpu-dkms` package on top of `driver-toolkit`.
The `amdgpu-dkms` package installs the modules in
`/lib/modules/${KERNEL_VERSION}/extra` and these are the only modules in
that folder. The `amdgpu-dkms-firmware` package is installed as a
dependency of `amdgpu-dkms` and it installs the firmware files in
`/lib/firmware/updates/amdgpu`. So, this change removes the in-tree
`amdgpu` modules and firmware, then copies the ones generated by DKMS in
the `builder` stage.
The change also moves the repository definitions to the `repos.d` folder
and adds the AMD public key to verify the signatures of the AMD RPMs.
The users call a wrapper script called `ilab` to hide the `instructlab`
container image and the command line options. This change copies the
file from `nvidia-bootc` and adjusts the logic. The main change is that
`/dev/kfd` and `/dev/dri` devices are passed to the container, instead
of `nvidia.com/gpu=all`. The `ilab` wrapper is copied in the `amd-bootc`
image.
The Makefile is also modified to reflect these changes.
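As a rough sketch, the device handling differs like this (the image variable and the remaining flags are assumptions, not the exact script):
```bash
# NVIDIA variant uses CDI: --device nvidia.com/gpu=all
# AMD variant passes the plain device nodes instead:
podman run --rm -it \
  --device /dev/kfd \
  --device /dev/dri \
  "${IMAGE_NAME}" ilab "$@"
```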
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
The comment is no longer relevant since we changed the way we pass
environment variables to the container.
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
The use of a uid map leads to a new layer with all files chowned.
This takes several seconds due to the size of the instructlab
container (26GB). Normally this would be a one time cost where
the idmap layer is cached and reused across container creations;
however, since the container is stored on a read-only additional
image store, no caching is performed.
Address the problem by creating a derived empty container in
mutable container storage. This allows the 1k idmap layer to be
created in the same area, yet reuses the layers in additional
image store.
Signed-off-by: Jason T. Greene <jason.greene@redhat.com>
The `/dev/nvswitchctl` device is created by the NVIDIA Fabric Manager
service, so it cannot be a condition for the `nvidia-fabricmanager`
service.
Looking at the NVIDIA driver startup script for Kubernetes, the actual
check is the presence of `/proc/driver/nvidia-nvswitch/devices` and the
fact that it's not empty [1].
This change modifies the condition to
`ConditionDirectoryNotEmpty=/proc/driver/nvidia-nvswitch/devices`, which
verifies that a certain path exists and is a non-empty directory.
[1] https://gitlab.com/nvidia/container-images/driver/-/blob/main/rhel9/nvidia-driver?ref_type=heads#L262-269
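A hedged sketch of the kind of patch applied to the unit (the original condition string and the unit path are assumptions; the Containerfile may phrase it differently):
```bash
# Replace the device-based condition with a check on the nvswitch proc directory.
sed -i \
  's|ConditionPathExists=/dev/nvswitchctl|ConditionDirectoryNotEmpty=/proc/driver/nvidia-nvswitch/devices|' \
  /usr/lib/systemd/system/nvidia-fabricmanager.service
```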
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
The `nvidia-driver` package provides the firmware files for the given
driver version. This change removes the copy of the firmware from the
builder step and installs the `nvidia-driver` package instead. This also
allows better traceability of the files in the final image.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
Intel has released the version `1.17.0-495` of their Gaudi drivers. They
are available explicitly for RHEL 9.4 with a new `9.4` folder in the RPM
repository. This change updates the arguments to use the new version
from the new repository folder.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
When building the `driver-toolkit` image, it is cumbersome to find the kernel
version that matches the future `nvidia-bootc` and `intel-bootc` images.
However, the kernel version is stored as a label on the `rhel-bootc`
images, which are exposed as the `FROM` variable in the Makefile.
This change collects the kernel version using `skopeo inspect` and `jq`.
The `DRIVER_TOOLKIT_BASE_IMAGE` variable is introduced in the Makefile
to dissociate it from the `FROM` variable that is used as the `nvidia-bootc`
and `intel-bootc` base image.
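A rough sketch of the lookup, assuming the kernel version is exposed through the `ostree.linux` label on the bootc base image (the label name is an assumption here):
```bash
# Read the kernel version label from the base image without pulling it.
KERNEL_VERSION=$(skopeo inspect "docker://${FROM}" | jq -r '.Labels["ostree.linux"]')
echo "${KERNEL_VERSION}"
```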
The user can now specify something like:
```shell
make nvidia-bootc \
FROM=quay.io/centos-bootc/centos-bootc:stream9 \
DRIVER_TOOLKIT_BASE_IMAGE=quay.io/centos/centos:stream9
```
Also, the `VERSION` variable in `/etc/os-release` is the full version, so
this change modifies the command to retrieve the `OS_VERSION_MAJOR`
value.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
During the build of the out-of-tree drivers, the base image will always
have the `kernel-core` package installed. And the `Makefile` doesn't
pass the `KERNEL_VERSION` argument to the build command. So, it's
simpler to rely on the `kernel-core` package info.
The commands to get the `KREL` and `KDIST` were not working with the RHEL
9.4 kernel. The new set of commands has been tested with `ubi9/ubi:9.4`
and `centos/centos:stream9` based driver toolkit image and they return
the correct value. For example, the values returned for the following
kernels are:
* `5.14.0-427.28.1.el9_4` (`ubi9/ubi:9.4`):
  * `KVER`: `5.14.0`
  * `KREL`: `427.28.1`
  * `KDIST`: `.el9_4`
* `5.14.0-427.el9` (`centos/centos:stream9`):
  * `KVER`: `5.14.0`
  * `KREL`: `427`
  * `KDIST`: `.el9`
The `OS_VERSION_MAJOR` argument is also not passed by the `Makefile`,
but we can get it from the `/etc/os-release` file. I'm switching to
grep+sed, because I don't want to load all the other variables.
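A sketch of the approach, matching the values listed above (the exact expressions in the Containerfile may differ slightly):
```bash
# Derive KVER/KREL/KDIST from the installed kernel-core package.
KVER=$(rpm -q --qf '%{VERSION}' kernel-core)
RELEASE=$(rpm -q --qf '%{RELEASE}' kernel-core)   # e.g. 427.28.1.el9_4 or 427.el9
KREL=$(echo "${RELEASE}" | sed 's/\.el.*$//')
KDIST=$(echo "${RELEASE}" | sed 's/^.*\(\.el[0-9_]*\)$/\1/')

# OS_VERSION_MAJOR via grep+sed, without sourcing the whole /etc/os-release.
OS_VERSION_MAJOR=$(grep '^VERSION_ID=' /etc/os-release | sed 's/VERSION_ID="\([0-9]*\).*/\1/')
```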
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
In the `nvidia-bootc` Containerfile, the condition on the existence of
`/dev/nvswitchctl` in the `nvidia-fabricmanager` unit file is not
persisted, because we don't use the `-i` option of `sed`, so the final
image still always tries to load the service. This change adds the `-i`
option to fix this.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
# Background
df8885777d
# Issue
The current error handling for multiple subuid ranges is broken due to
surprising behavior of `wc -l` which always returns `1` even when the
input is empty.
# Solution
More carefully count the number of lines in the
`CURRENT_USER_SUBUID_RANGE` variable
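For illustration, the pitfall and a safer count (variable name taken from the description above; the script's exact fix may differ):
```bash
CURRENT_USER_SUBUID_RANGE=""
echo "$CURRENT_USER_SUBUID_RANGE" | wc -l   # prints 1: echo always emits a trailing newline

# Safer: treat an empty variable as zero lines.
if [[ -z "$CURRENT_USER_SUBUID_RANGE" ]]; then
  range_count=0
else
  range_count=$(printf '%s\n' "$CURRENT_USER_SUBUID_RANGE" | wc -l)
fi
```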
# Additional changes
50fb00f26f had a small merge error, this
commit fixes that.
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
We have a file that's always a duplicate of another file; until we can
get rid of this requirement, a pre-commit hook to take care of it would
be nice.
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
vLLM fails with empty set values. Adjust the env passing to
only set a value if it is defined.
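A minimal sketch of the idea (the variable names are examples, not the wrapper's exact list):
```bash
# Only forward environment variables that actually have a value.
ENV_ARGS=()
for var in VLLM_LOGGING_LEVEL NCCL_DEBUG; do
  if [[ -n "${!var:-}" ]]; then
    ENV_ARGS+=("--env" "${var}=${!var}")
  fi
done
# podman run "${ENV_ARGS[@]}" ... (rest of the command elided)
```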
Signed-off-by: Jason T. Greene <jason.greene@redhat.com>
# Background
See df8885777d
# Issue
Introduced a regression [1] where it's no longer possible to run the script
as root, as the subuid map ends up being empty and this causes an error:
```
Error: invalid empty host id at UID map: [1 1]
```
# Solution
Avoid UID mapping if we're already running as root.
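A minimal sketch of the check, assuming the wrapper collects its ID-mapping flags in an array:
```bash
ID_MAP_ARGS=()
if [[ "$(id -u)" -ne 0 ]]; then
  # Only non-root invocations need the container root remapped to the caller.
  ID_MAP_ARGS+=("--uidmap" "0:$(id -u):1")
fi
# podman run "${ID_MAP_ARGS[@]}" ... (rest of the command elided)
```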
# Motivation
We want to also be able to run the script as root, for example as part
of a systemd service.
[1] RHELAI-798
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
The default base image for the Driver Toolkit image is `centos:stream9`.
The original work for Driver Toolkit is in OpenShift and the base image
is `ubi9/ubi`. In both cases, the images don't have the `kernel`
package installed.
This change adds a test on the `KERNEL_VERSION` argument and exits if
it's not provided at build time. This also ensures that only the
relevant kernel is present when using `centos:stream9` or `ubi9/ubi`
as the base image. And this realigns a bit with the original Driver
Toolkit.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
- Set all indenting to 4 spaces (no tabs)
- Use POSIX style function definition in oneliner functions
- Remove unneeded exports on env variables
Signed-off-by: Javi Polo <jpolo@redhat.com>
Include ILAB_GLOBAL_CONFIG, VLLM_LOGGING_LEVEL, and NCCL_DEBUG as environment variables when starting the ilab container. Also add shared memory size of 10G to enable vllm execution. Resolves: https://github.com/containers/ai-lab-recipes/issues/721
Signed-off-by: Tyler Lisowski <lisowski@us.ibm.com>
# Background
The ilab command is wrapped by an `ilab` script which launches ilab
inside a podman container.
# Issue
Since the ilab container image is pulled during the bootc image build
process using the root user, the image is not accessible to non-root
users.
# Solution
We run the container as sudo in order to be able to access the root
container storage. But for security reasons we map root UID 0 inside the
container to the current user's UID (and all the other subuids to the
user's /etc/subuid range) so that we're effectively running the
container as the current user.
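A rough sketch of the mapping described above (the real script reads the subordinate range from /etc/subuid; the numbers here are placeholders):
```bash
CURRENT_UID="$(id -u)"
SUBUID_START=100000   # placeholder: taken from the user's /etc/subuid entry
SUBUID_SIZE=65536     # placeholder: taken from the user's /etc/subuid entry

sudo podman run \
  --uidmap "0:${CURRENT_UID}:1" \
  --uidmap "1:${SUBUID_START}:${SUBUID_SIZE}" \
  --env "HOME=$HOME" \
  "${IMAGE_NAME}" ilab "$@"
```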
# Additional changes
Changed `"--env" "HOME"` to `"--env" "HOME=$HOME"` to pass the HOME
environment variable from the current shell and not from the sudo
environment.
# Future work
In the future, we will run podman as the current user, once we figure out a
reasonable way for the current user to access the root's user container
storage
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
# Background
We have an ilab wrapper script that users will use to launch the ilab
container.
Users may want to mount additional volumes into the container, as they
could possibly have e.g. large models stored in some external storage.
# Problem
Users cannot simply edit the script to add the mounts to the podman
command as it is read-only.
# Solution
Add support for an environment variable that users can set to specify
additional mounts to be added to the podman command. This will allow
users to specify additional mounts without having to modify the script.
# Implementation
The script will now check for the `ILAB_ADDITIONAL_MOUNTS` environment
variable. If it is set, the script will parse the variable as evaluated
bash code to get the mounts. The mounts will then be added to the podman
command.
Example `ILAB_ADDITIONAL_MOUNTS` usage:
```bash
ILAB_ADDITIONAL_MOUNTS="/host/path:/container/path /host/path2:/container/path2"
```
If your path contains spaces, you can use quotes:
```bash
ILAB_ADDITIONAL_MOUNTS="/host/path:/container/path '/host/path with spaces':/container/path"
```
The latter works because the script uses `eval` to parse the mounts.
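A sketch of how the eval-based parsing can be wired in (array and flag names are illustrative, not the script's exact code):
```bash
ADDITIONAL_MOUNT_ARGS=()
if [[ -n "${ILAB_ADDITIONAL_MOUNTS:-}" ]]; then
  # eval preserves quoted entries that contain spaces.
  eval "mounts=(${ILAB_ADDITIONAL_MOUNTS})"
  for mount in "${mounts[@]}"; do
    ADDITIONAL_MOUNT_ARGS+=("-v" "${mount}")
  done
fi
# podman run "${ADDITIONAL_MOUNT_ARGS[@]}" ... (rest of the command elided)
```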
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
The wrapper had a mix of tabs and spaces, making it annoying to edit
Formatted with shfmt to switch to spaces
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
If the wrapper script is killed, the container will be left running.
Instead of just running the command, use `exec` to replace the
wrapper script with the command, so that the command will receive
the same signals as the wrapper script and the container will be
terminated as expected.
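In sketch form (the actual command line is longer):
```bash
# Before: podman run ... "$@"
# After: replace the wrapper process so signals reach podman directly.
exec podman run --rm -it "${IMAGE_NAME}" ilab "$@"
```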
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
The upgrade informer will run every couple of hours and will be triggered by a
systemd timer.
In order to start it on boot and run it once, both the service and the timer are enabled.
The auto-upgrade service is disabled in order to avoid unexpected reboots.
The service will run "bootc upgrade --check" and, in case a new version exists,
it will create a motd file with the upgrade info.
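A hypothetical sketch of the informer's check (the matched string, motd path, and wording are assumptions, not the exact script added here):
```bash
# Runs from a systemd timer every couple of hours.
if bootc upgrade --check | grep -q 'Update available'; then   # matched string is an assumption
  echo "A new image version is available; run 'bootc upgrade' to install it." \
    > /etc/motd.d/upgrade-available.motd
else
  rm -f /etc/motd.d/upgrade-available.motd
fi
```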
Signed-off-by: Igal Tsoiref <itsoiref@redhat.com>
Signed-off-by: Javi Polo <jpolo@redhat.com>
While skopeo may be part of the base image, there is no
guarantee, and as long as ilab requires it, we should
make sure it is installed.
Signed-off-by: Dan Walsh <dwalsh@redhat.com>
Background
RHEL AI ships with a script in `/usr/bin` called `ilab` which
makes running `ilab` commands feel native even though they're actually
running in a podman container
Issues
The abstraction becomes leaky once you start dealing with paths.
The user thinks these are local paths, but they are actually paths inside the pod,
and if the user is doing any action with a path that's not mounted inside the pod,
files persisted to that path will not persist across ilab wrapper invocations
Examples:
1. ilab config init outputs:
Generating `/root/.config/instructlab/config.yaml`...
Initialization completed successfully, you're ready to start using `ilab`. Enjoy!
But:
ls /root/.config/instructlab/config.yaml
ls: cannot access '/root/.config/instructlab/config.yaml': Permission denied
2. User provided paths e.g.:
ilab config init --model-path...
ilab model download --model-dir=...
The path may not be mounted to the host, so the data is written to the overlay fs and is gone when the container dies
Solution
Mount the user's HOME directory and set HOME inside the container.
This seems to resolve the above issues as long as the user-provided paths
are nested under the user's HOME directory.
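In sketch form, assuming the wrapper already assembles a podman command:
```bash
podman run --rm -it \
  -v "$HOME:$HOME" \
  --env "HOME=$HOME" \
  "${IMAGE_NAME}" ilab "$@"
```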
Signed-off-by: Eran Cohen <eranco@redhat.com>
Ticket [RHELAI-442](https://issues.redhat.com/browse/RHELAI-442)
# Background
RHEL AI ships with a script in `/usr/local/bin` called `ilab` which
makes running `ilab` commands feel native even though they're actually
running in a podman container
# Issues
* The script is outdated / used several different container images for
different purposes, while it should be just using the single instructlab
image
* The volume mounts were incorrect, as instructlab now uses XDG paths
* Unnecessary directory creation for `HF_CACHE`
* Unnecessary GPU count logic
* Script has unnecessary fiddling of `ilab` parameters, essentially creating a
UX that deviates from the natural `ilab` CLI
# Solutions
* Changed script to use the single container image `IMAGE_NAME` (this
was already the case mostly, except for old references to `LVLM_NAME`
and `TRAIN_NAME` which no longer get replaced, leading to a broken `PODMAN_COMMAND_SERVE`).
Also adjusted the entrypoint to use the `ilab` executable in the pyenv.
* Will now mount the host's `~/.config` and `~/.local` into the
container's corresponding directories, for `instructlab` to use
and for its config / data to persist across invocations
* Will now mount `~/.cache` into the container's corresponding `.cache`
directory, so that the information stored in the default `HF_CACHE` is
also persisted across invocations
* Removed unnecessary GPU count logic
* Removed all parameter parsing / fiddling
# Other changes
Added secret/fake "shell" `ilab` subcommand which opens a shell in the
wrapper's container, useful for troubleshooting issues with the wrapper
itself
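A sketch of the mount layout described in the list above (the entrypoint and image variable are assumptions, not the literal script):
```bash
podman run --rm -it \
  -v "$HOME/.config:$HOME/.config" \
  -v "$HOME/.local:$HOME/.local" \
  -v "$HOME/.cache:$HOME/.cache" \
  --env "HOME=$HOME" \
  --entrypoint ilab \
  "${IMAGE_NAME}" "$@"
```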
Signed-off-by: Omer Tuchfeld <omer@tuchfeld.dev>
it matches much better.
Change the way we set the image_version_id label; in order for it to work in
Konflux we should use LABEL in the Containerfile.
Signed-off-by: Igal Tsoiref <itsoiref@redhat.com>
Of note, there was already a use of a "VENDOR" word to describe the
accelerator or provider (amd, intel, nvidia, etc.). I renamed that
in order to make room for this new use of VENDOR.
Signed-off-by: Ralph Bean <rbean@redhat.com>
Set the GitHub commit hash as the image version by default.
Add RHEL_AI_VERSION into /etc/os-release in order to use it in
insights
Signed-off-by: Igal Tsoiref <itsoiref@redhat.com>
The `nvidia-persistenced` and `nvidia-fabricmanager` services should be
started on machines with NVIDIA devices. Fabric Manager is only needed
on machines with an NVLink switch, so we patch it to start only if
/dev/nvswitchctl is present.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
Upstream, this image can be pulled unauthenticated, but in other
environments a user might want to include an image that exists in some
repository that requires authentication to pull.
The person building the image needs to provide
`--secret=id=instructlab-nvidia-pull/.dockerconfigjson,src=instructlab-nvidia-pull/.dockerconfigjson`
when building the image in order to make the secret available.
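For example, a build invocation could look roughly like this (the tag and Containerfile path are placeholders):
```bash
podman build \
  --secret=id=instructlab-nvidia-pull/.dockerconfigjson,src=instructlab-nvidia-pull/.dockerconfigjson \
  -t quay.io/ai-lab/nvidia-bootc:latest \
  -f Containerfile .
```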
Signed-off-by: Ralph Bean <rbean@redhat.com>
For the InstructLab image, we use NVIDIA driver version `550.90.07` with
CUDA `12.4.1`, so this change updates the versions in the bootc image to
align the stack.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
- Fix model download container and targets
- Add prometheus model for eval
- Improve caching in instructlab container
- Add additional "models" targets for all permutations
- Introduce build chaining so that you can build everything in one step
- Small update to conform to $(MAKE) convention for submakes
Signed-off-by: Jason T. Greene <jason.greene@redhat.com>
The top level vendor targets (amd, intel, nvidia) fail with
"podman" build \
\
--file /root/ai-lab-recipes/training/model/../build/Containerfile.models \
--security-opt label=disable \
--tag "quay.io/ai-lab/-bootc-models:latest" \
-v /root/ai-lab-recipes/training/model/../build:/run/.input:ro
Error: tag quay.io/ai-lab/-bootc-models:latest: invalid reference format
make[1]: *** [Makefile:41: bootc-models] Error 125
make[1]: Leaving directory '/root/ai-lab-recipes/training/model'
make: *** [Makefile:70: bootc-models] Error 2
because VENDOR is not defined when the bootc-models target is called.
Modify the makefile to set VENDOR for each target.
Signed-off-by: Prarit Bhargava <prarit@redhat.com>
- Properly separate and order podman and bootc-image-builder arguments
- Move all the `selinux.tmp` workaround to the same layer, so bootc
install won't complain about missing files
Signed-off-by: Javi Polo <jpolo@redhat.com>
Any Gaudi update must be synchronized with all stakeholders. For now,
all packages from Kernel OOT drivers over firmware and SynapseAI to
PyTorch stack must have the same version. `habana-torch-plugin` version
`1.16.0.526` does not work with Kernel drivers `1.16.1-7`.
Signed-off-by: Christian Heimes <cheimes@redhat.com>
The NVIDIA bootc container is using multi-stage to avoid shipping build
dependencies in the final image, making it also smaller. This change
implements the same build strategy for the Intel bootc image.
The builder image is the same as for NVIDIA bootc. It is currently named
after NVIDIA, but should be renamed in a follow-up change. The benefit
is that a single builder image is maintained for all bootc images that
require out-of-tree drivers.
The number of build arguments is also reduced, since most of the
information is already present in the builder image. There is only one
kernel package per builder image and one image per architecture, so we
can retrieve the `KERNEL_VERSION` and `TARGET_ARCH` variables by
querying the RPM database. The OS information is retrieved by sourcing
the `/etc/os-release` file.
The extraction of the RPMs doesn't require storing the files, as
`rpm2cpio` supports streaming the file over HTTP(S). The number of
commands is smaller, and the downloads already happened for each build
anyway, since the download was not in a separate `RUN` statement.
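One way to stream an RPM without keeping it on disk looks roughly like this (the URL is a placeholder; the Containerfile may pass the URL to `rpm2cpio` directly):
```bash
curl -sL "https://example.com/path/to/driver-package.rpm" | rpm2cpio | cpio -idmv
```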
It is not necessary to copy the source of the drivers in `/usr/src`, since
we don't need to keep it in the final image. The Makefiles accept a
`KVERSION` variable to specify the version of the kernel and resolve its
path. The other benefit is to build as non-root.
The `.ko` files can then be copied to the final image with `COPY
--from=builder`. The change also ensures that the firmware files are
copied to the final image.
This change also adds support for `EXTRA_RPM_PACKAGES`.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
- Fix wrong script install (container lab used over wrapper [won't run on its own])
+ Restores elements that were unintentionally removed
- Fix quay tags
- Introduce "$ARCH-bootc-models" images in addition to bootc that include models
Signed-off-by: Jason T. Greene <jason.greene@redhat.com>
growfs is created by the Makefile and CI does not use it. Also, if I'm not mistaken, growfs is only used for disk image creation.
With this change, the growfs file will only be created when the Makefile is running, so CI pipelines can build the Containerfile and growfs can still be used when needed.
Signed-off-by: Enrique Belarte Luque <ebelarte@redhat.com>
Konflux CI fails when building using bootc images as base throwing this error:
`Error: Cannot create repo temporary directory "/var/cache/dnf/baseos-044cae74d71fe9ea/libdnf.1jsyRp": Permission denied`
This temporary workaround is needed for build pipeline to work on Konflux CI until libdnf fix is merged to RHEL.
References:
https://issues.redhat.com/browse/RHEL-39796
https://github.com/rpm-software-management/libdnf/pull/1665
This should be removed once the permanent fix is merged.
Signed-off-by: Enrique Belarte Luque <ebelarte@redhat.com>
Many commands that are run for SDG and training can take a lot of time,
so there is a risk to have a network disconnection during the task. With
`tmux`, users have the ability to detach the jobs from their SSH session
and let the tasks run for a very long time.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
The `lspci` command is frequently used to inspect the hardware on a
server. Adding it to the OS image would help users to troubleshoot
deployment and configuration issues.
Signed-off-by: Fabien Dupont <fdupont@redhat.com>
Some users want to use buildah instead of podman to build
their container images.
Buildah does not support --squash-all, but after examining the podman
code, --squash-all ends up just being the equivalent of `--squash --layers=false`.
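Roughly equivalent invocations (image name and Containerfile path are placeholders):
```bash
podman build --squash-all -t example/image -f Containerfile .
buildah build --squash --layers=false -t example/image -f Containerfile .
```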
Signed-off-by: Daniel J Walsh <dwalsh@redhat.com>
Fixed two instructions in the README.
1) The instruction to make the model pointed to detr-resnet-50 rather than the detr-resnet-101 that the instructions use.
2) The client container start had a /detection in the model address where it should not have.
added signoff
Signed-off-by: Graeme Colman <gcolman@redhat.com>
And hence mixtral download fails
Downloading model failed with the following Hugging Face Hub error: 401 Client Error. (Request ID: Root=1-6637576e-28a8c5cb049f1dbb35d46d83;86121860-3ce0-419b-aed0-4fc79c440da7)
Cannot access gated repo for url https://huggingface.co/api/models/mistralai/Mixtral-8x7B-Instruct-v0.1/tree/main?recursive=True&expand=False.
Access to model mistralai/Mixtral-8x7B-Instruct-v0.1 is restricted. You must be authenticated to access it.
Signed-off-by: Rom Freiman <rfreiman@gmail.com>
We are seeing lots of users running out of disk space.
The target should help free up wasted space, but be
careful that no builds are running when you execute the command.
Signed-off-by: Daniel J Walsh <dwalsh@redhat.com>
In order to run podman inside of a container we need to disable
SELinux enforcement and add CAP_SYS_ADMIN to allow mounting
of overlay file systems. This matches what we are doing in the
nvidia and amd bootc containers.
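In sketch form (the image name is a placeholder):
```bash
podman run --rm -it \
  --security-opt label=disable \
  --cap-add SYS_ADMIN \
  example/builder-image
```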
Signed-off-by: Daniel J Walsh <dwalsh@redhat.com>
This is a little hacky to just get this in. Would be
better if we shared this all with the recipes subdir,
but for speed I just want to get this in.
We will need to revisit the Makefile.common concept
to share more between recipes and training.
Signed-off-by: Daniel J Walsh <dwalsh@redhat.com>
No reason to use containers/storage for instructlab or vllm
since we are only building for embedding within a bootc image.
By storing directly in OCI, we can save many minutes and lots of
disk size.
Signed-off-by: Daniel J Walsh <dwalsh@redhat.com>
The current source path is `../../common/usr` and it will copy to
destination path `build/usr/usr/`. I checked that the results are
different between Linux and macOS, so modify it to adapt to both
platforms.
fix: #410
Signed-off-by: Yihuang Yu <yihyu@redhat.com>
When using this on an alternate platform like aarch64, at least it will
cause the make script to fail early when the aarch64 file doesn't exist,
rather than incorrectly downloading the amd64 version. aarch64 chrome
may get packaged in the future also.
Signed-off-by: Eric Curtin <ecurtin@redhat.com>
we now have the ability to do a top level `serve` in the ilab-wrapper which will start a vllm server, and run `generate` which will connect to the ENDPOINT_URL specified
Signed-off-by: Charlie Doern <cdoern@redhat.com>
Also create a Makefile.common in training so that the
different hardware vendors Makefiles can share options.
Signed-off-by: Daniel J Walsh <dwalsh@redhat.com>
This extends nvidia-bootc:
- Adds the instructlab container image
- Uses a save/load approach instead of pull to avoid registry issues
- Adds an ilab wrapper script to orchestrate usage of ilab
+ In the near future this will be extended to coordinate the soon
to come multi-container mechanism for training but gets us
something working now.
- Adds ssh key setup
Signed-off-by: Jason T. Greene <jason.greene@redhat.com>
DISK_USER and DISK_GROUP are from #299, they are used for bib option
`--chown`. However, the current variable names may cause
misunderstanding and mislead people into thinking they refer to an
operating system user inside the disk, so rename them.
Also, add these 2 variables into the README.
Signed-off-by: Yihuang Yu <yihyu@redhat.com>
The `bootc-image-builder` target depends on `bootc`; even if the bootc image
exists in local storage, it still builds a new one. Since we add
`--local` to the podman command line, this commit only checks for the image in
local storage and does not check the remote registry.
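The kind of check involved, sketched as shell (target and variable names are illustrative):
```bash
podman image exists "${REGISTRY}/${IMAGE_NAME}" || make bootc
```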
Signed-off-by: Yihuang Yu <yihyu@redhat.com>
We have hardcoded fields in both the Makefile and the
Containerfiles; only hard-code them in the Containerfiles
so we are less likely to make a mistake.
Signed-off-by: Daniel J Walsh <dwalsh@redhat.com>
The models/README.md described a bunch of download-model flags
that did not exist or were defined in different makefiles. This
PR removes the non-existing targets and adds the defined targets
into the models/Makefile, referencing them from the others.
Signed-off-by: Daniel J Walsh <dwalsh@redhat.com>
bootc-image-builder requests root permission, which means the generated
disk image is owned by the root user. Helpfully, bib provides the
"--chown" option to help us change the owner of the output directory.
This makes it easy for users to customize the UID:GID of the disk image and use it later.
Signed-off-by: Yihuang Yu <yihyu@redhat.com>
Update the descriptions of the recipes. They are used by the AI Lab
Podman Desktop extension and were quite repetitive and did not guide the
user much into the various domains and use cases. I tried to describe
a bit more what each recipe does.
Fixes: #297
Signed-off-by: Valentin Rothberg <vrothberg@redhat.com>
In a Makefile, when we use a double "$", we should make sure the variable
is present in the environment. However, in the current design, most
variables are Makefile variables, so the shell fails to handle them.
Signed-off-by: Yihuang Yu <yihyu@redhat.com>
Our standard workflows deal with building components and pushing their images to `quay.io/ai-lab`. These components include:
- recipe applications:
  - Chatbot
  - Codegen
  - Summarizer
  - RAG
- model_servers
- models
- instructlab workflows
- training bootc workflows
For a full list of the images we build, check out our [quay organization](https://quay.io/organization/ai-lab). These standard workflows should all be run against our standard repo `containers/ai-lab-recipes` rather than the mirror repo.
## Testing frameworks
Our testing frameworks are a bit different from our standard workflows. In terms of compute, some of these jobs run on either AWS machines provisioned via terraform using secrets in the github repository or on customized github-hosted action runners, as well as on the standard ubuntu-24.04 github runners for jobs not requiring additional resources.
These workflows start by checking out the [terraform-test-environment-module](https://github.com/containers/terraform-test-environment-module) repo, as well as the code in `containers/ai-lab-recipes` at the `main` branch. Then it will provision the terraform instance, install the correct ansible playbook requirements, and run a corresponding playbook. Additional actions may also be taken depending on the testing framework in question.
Finally all of our testing framework workflows will call `terraform destroy` to remove the aws instance we have provisioned and publish the results of the workflow to slack.
IMPORTANT: If you are doing development and testing, please make sure that instances in AWS are spun down before leaving if you have access to the AWS account.
### training-e2e
The test environment is initially based on `Fedora 40`.
It bootstraps a `g5.8xlarge` AWS EC2 instance with Terraform.
Provisioning is executed with ansible. The ansible playbook is invoking bootc install and
## Contributing New Model Servers
There are a number of options out there for model servers and we want to ensure that we provide developers with a variety of vetted options for the model server that will meet their application's needs.
Deciding which model server is right for a particular use case primarily comes down to the kind of model you want to use (LLM, Object Detection, Data Classification, etc.) and the resources available (GPU, CPU, Cloud, Local).
AI Lab Recipes' default model server is [llamacpp_python](https://github.com/abetlen/llama-cpp-python), which needs models to be in a `*.GGUF` format.
However, most models available on [huggingface](https://huggingface.co/models) are not provided directly as `*.GGUF` files. More often they are provided as a set of `*.bin` or `*.safetensor` files with some additional metadata produced when the model is trained.
There are of course a number of users on huggingface who provide `*.GGUF` versions of popular models. But this introduces an unnecessary interim dependency as well as possible security or licensing concerns.
To avoid these concerns and provide users with the maximum freedom of choice for their models, we provide a tool to quickly and easily convert and quantize a model from huggingface into a `*.GGUF` format for use with our `*.GGUF` compatible model servers.

## Quantize and Convert
You can run the conversion image directly with podman in the terminal. You just need to provide it with the huggingface model name you want to download, the quantization level you want to use and whether or not you want to keep the raw files after conversion. "HF_TOKEN" is optional, it is required for private models.
You can also use the UI shown above to do the same.
## Model Storage and Use
This process writes the models into a podman volume under a `gguf/` directory and not directly back to the user's host machine (This could be changed in an upcoming update if it is required).
If a user wants to access these models to use with the llamacpp_python model server, they would simply point their model service to the correct podman volume at run time. For example:
st.session_state["Question"]="What is the Higgs Boson?"
if"Answers"notinst.session_state:
st.session_state["Answers"]={}
st.session_state["Answers"]["Right_Answer_1"]="The Higgs boson, sometimes called the Higgs particle, is an elementary particle in the Standard Model of particle physics produced by the quantum excitation of the Higgs field, one of the fields in particle physics theory"
st.session_state["Answers"]["Wrong_Answer_1"]="Alan Turing was the first person to conduct substantial research in the field that he called machine intelligence."
In some cases it will be useful for developers to update the base language model they are using (like Llama2) with some custom data of their own. In order to do this they can "finetune" the model by partially retraining it with their custom data set. There are a number of ways to do this, and they vary in complexity and computational resource requirements. Here we will continue to rely on the [llama.cpp](https://github.com/ggerganov/llama.cpp) package and do LoRA (Low-Rank Adaption) fine tuning which often requires fewer resources than other fine tuning methods.
### Use the container image
We have created a pre-built container image for running the finetuning and producing a new model on a mac. The image can be found at [quay.io/michaelclifford/finetunellm](quay.io/michaelclifford/finetunellm).
```bash
podman pull quay.io/michaelclifford/finetunellm
```
It only requires 2 things from a user to start fine tuning. The data they wish to finetune with, and the Llama based model they want to finetune (the current implementation requires a variant of the Llama model).
### Make the data accessible
This is the trickiest part of the current demo and I'm hoping to find a smoother approach moving forward. That said, there are many ways to get data into and out of pods and containers, but here we will rely on exposing a directory on our local machine as a volume for the container.
This also assumes that `<location/of/your/data/>` contains the following 2 files.
```bash
podman run --rm -it -v <location/of/your/data/>:/locallm/data/ finetunellm
```
This will run 10 iterations of LoRA finetuning and generate a new model that can be exported and used in another chat application. I'll caution that 10 iterations is likely insufficient to see a real change in the model outputs, but it serves here for demo purposes.
### Export the model
Now that we have our fine-tuned model we will want to move it out of the Podman machine and onto our local host for use by another application. Again, I'm sure there are better ways to do this long term.
Here we will rely on Podman's copy function to move the model.
If you would like to use a different model or dataset, you can replace the training data file in `data/` as well as the `.gguf` model file. However, for now llama.cpp finetuning requires a Llama variant model to be used.
To change the data and model used you can set the following environment variables when starting a new container.
* `DATA=data/data/<new-data-file>`
* `MODEL_FILE=data/<new-model-file.gguf>`
* `NEW_MODEL=<name-of-new-finetuned-model.gguf>`
```bash
podman run -it -v <location/of/your/data/>:/locallm/data/ \
The llamacpp_python model server images are based on the [llama-cpp-python](https://github.com/abetlen/llama-cpp-python) project that provides python bindings for [llama.cpp](https://github.com/ggerganov/llama.cpp). This provides us with a python based and OpenAI API compatible model server that can run LLMs of various sizes locally across Linux, Windows or Mac.
This model server requires models to be converted from their original format, typically a set of `*.bin` or `*.safetensor` files into a single GGUF formatted file. Many models are available in GGUF format already on [huggingface.co](https://huggingface.co). You can also use the [model converter utility](../../convert_models/) available in this repo to convert models yourself.
## Image Options
We currently provide 3 options for the llamacpp_python model server:
* [Base](#base)
* [Cuda](#cuda)
* [Vulkan (experimental)](#vulkan-experimental)
### Base
The [base image](../llamacpp_python/base/Containerfile) is the standard image that works for both arm64 and amd64 environments. However, it does not include any hardware acceleration and will run with CPU only. If you use the base image, make sure that your container runtime has sufficient resources to run the desired model(s).
To build the base model service image:
```bash
make build
```
To pull the base model service image:
```bash
podman pull quay.io/ai-lab/llamacpp_python
```
### Cuda
The [Cuda image](../llamacpp_python/cuda/Containerfile) includes all the extra drivers necessary to run our model server with Nvidia GPUs. This will significantly speed up the model's response time over CPU-only deployments.
To build the Cuda variant image:
```bash
make build-cuda
```
To pull the base model service image:
```bash
podman pull quay.io/ai-lab/llamacpp_python_cuda
```
**IMPORTANT!**
To run the Cuda image with GPU acceleration, you need to install the correct [Cuda drivers](https://docs.nvidia.com/cuda/cuda-installation-guide-linux/index.html#driver-installation) for your system along with the [Nvidia Container Toolkit](https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/latest/install-guide.html#). Please use the links provided to find installation instructions for your system.
Once those are installed you can use the container toolkit CLI to discover your Nvidia device(s).
Finally, you will also need to add `--device nvidia.com/gpu=all` to your `podman run` command.
### Vulkan (experimental)
The [Vulkan](https://docs.vulkan.org/guide/latest/what_is_vulkan.html) image ([amd64](../llamacpp_python/vulkan/amd64/Containerfile)/[arm64](../llamacpp_python/vulkan/arm64/Containerfile)) is experimental, but can be used for gaining partial GPU access on an M-series Mac, significantly speeding up model response time over a CPU only deployment. This image requires that your podman machine provider is "applehv" and that you use krunkit instead of vfkit. Since these tools are not currently supported by podman desktop this image will remain "experimental".
To build the Vulkan model service variant image:
| System Architecture | Command |
|---|---|
| amd64 | make build-vulkan-amd64 |
| arm64 | make build-vulkan-arm64 |
To pull the base model service image:
```bash
podman pull quay.io/ai-lab/llamacpp_python_vulkan
```
## Download Model(s)
There are many models to choose from these days, most of which can be found on [huggingface.co](https://huggingface.co). In order to use a model with the llamacpp_python model server, it must be in GGUF format. You can either download pre-converted GGUF models directly or convert them yourself with the [model converter utility](../../convert_models/) available in this repo.
A well-performing Apache-2.0 licensed model that we recommend using if you are just getting started is
`granite-7b-lab`. You can use the link below to quickly download a quantized (smaller) GGUF version of this model for use with the llamacpp_python model server.
Place all models in the [models](../../models/) directory.
You can use this snippet below to download the default model:
```bash
make download-model-granite
```
Or you can use the generic `download-models` target from the `/models` directory to download any model file from huggingface:
```bash
cd ../../models
make MODEL_NAME=<model_name> MODEL_URL=<model_url> -f Makefile download-model
# EX: make MODEL_NAME=granite-7b-lab-Q4_K_M.gguf MODEL_URL=https://huggingface.co/instructlab/granite-7b-lab-GGUF/resolve/main/granite-7b-lab-Q4_K_M.gguf -f Makefile download-model
```
To deploy the LLM server you must specify a volume mount `-v` where your models are stored on the host machine and the `MODEL_PATH` for your model of choice. The model_server is most easily deployed by calling the make command: `make -f Makefile run`. Of course, as with all our make calls, you can pass any number of the following variables: `REGISTRY`, `IMAGE_NAME`, `MODEL_NAME`, `MODEL_PATH`, and `PORT`.
To enable dynamic loading and unloading of different models present on your machine, you can start the model service with a `CONFIG_PATH` instead of a `MODEL_PATH`.
Here is an example `models_config.json` with two model options.
```json
{
```
The object_detection_python model server is a simple [FastAPI](https://fastapi.tiangolo.com/) application written specifically for use in the [object_detection recipe](../../recipes/computer_vision/object_detection/) with "DEtection TRansformer" (DETR) models. It relies on huggingface's transformer package for `AutoImageProcessor` and `AutoModelforObjectDetection` to process image data and to make inferences respectively.
Currently, the server only implements a single endpoint, `/detection`, that expects an image in bytes and returns an image with labeled bounding boxes and the probability scores of each bounding box.
## Build Model Server
To build the object_detection_python model server image from this directory:
You can download models from [huggingface.co](https://huggingface.co/) for this model server. This model server is intended to be used with "DEtection TRansformer" (DETR) models. The default model we've used and validated is [facebook/detr-resnet-101](https://huggingface.co/facebook/detr-resnet-101).
You can download a copy of this model into your `models/` directory with the make command below.
```bash
make download-model-facebook-detr-resnet-101
```
or any model with
```bash
cd ../../models/ && \
python download_hf_models.py -m <MODEL>
```
## Deploy Model Server
The model server relies on a volume mount to the localhost to access the model files. It also employs environment variables to dictate the model used and where it's served. You can start your model server using the following `make` command from the [`model_servers/object_detection_python`](../../../model_servers/object_detection_python) directory, which will be set with reasonable defaults:
The models directory stores models and provides automation around downloading models.
Want to try one of our tested models? Try one or all of the following:
```bash
make download-model-granite
make download-model-merlinite
make download-model-mistral
make download-model-mistral-code
make download-model-whisper-small
```
Want to download and run a model you don't see listed? This is supported with the `MODEL_NAME` and `MODEL_URL` params:
```bash
make download-model MODEL_URL=https://huggingface.co/TheBloke/openchat-3.5-0106-GGUF/resolve/main/openchat-3.5-0106.Q4_K_M.gguf MODEL_NAME=openchat-3.5-0106.Q4_K_M.gguf
```
The local Model Service relies on a volume mount to the localhost to access the model files.
```bash
make run
```
As stated above, by default the model service will use [`facebook/detr-resnet-101`](https://huggingface.co/facebook/detr-resnet-101). However you can use other compatible models. Simply pass the new `MODEL_NAME` and `MODEL_PATH` to the make command. Make sure the model is downloaded and exists in the [models directory](../../../models/):
```bash
# from path model_servers/object_detection_python from repo containers/ai-lab-recipes
make MODEL_NAME=facebook/detr-resnet-50 MODEL_PATH=/models/facebook/detr-resnet-101 run
```
## Build the AI Application
This could be any appropriately hosted Model Service (running locally or in the cloud).
The following Podman command can be used to run your AI Application:
```bash
podman run -p 8501:8501 -e MODEL_ENDPOINT=http://10.88.0.1:8000 object_detection_client