Skip to content

Commit 0dd31b0

Browse files
authored
Merge pull request #2053 from containers/rag-separate-container
run RAG operations in a separate container
2 parents 30653f5 + b386758 commit 0dd31b0

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

64 files changed

+22888
-1099
lines changed

.tekton/asahi-rag/asahi-rag-pull-request.yaml

Lines changed: 0 additions & 47 deletions
This file was deleted.

.tekton/asahi-rag/asahi-rag-push.yaml

Lines changed: 0 additions & 44 deletions
This file was deleted.

.tekton/cann-rag/cann-rag-pull-request.yaml

Lines changed: 0 additions & 47 deletions
This file was deleted.

.tekton/cann-rag/cann-rag-push.yaml

Lines changed: 0 additions & 44 deletions
This file was deleted.

.tekton/cuda-rag/cuda-rag-pull-request.yaml

Lines changed: 2 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -28,12 +28,10 @@ spec:
2828
value: 5d
2929
- name: dockerfile
3030
value: container-images/common/Containerfile.rag
31-
- name: parent-image
32-
value: quay.io/redhat-user-workloads/ramalama-tenant/cuda:on-pr-{{revision}}
3331
- name: build-args
3432
value:
35-
- PARENT=quay.io/redhat-user-workloads/ramalama-tenant/cuda:on-pr-{{revision}}
36-
- GPU=cuda
33+
- PARENT=docker.io/nvidia/cuda:12.8.1-devel-ubi9
34+
- TORCH_BACKEND=cu128
3735
pipelineRef:
3836
name: pull-request-pipeline
3937
timeouts:

.tekton/cuda-rag/cuda-rag-push.yaml

Lines changed: 2 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -25,12 +25,10 @@ spec:
2525
value: quay.io/redhat-user-workloads/ramalama-tenant/cuda-rag:{{revision}}
2626
- name: dockerfile
2727
value: container-images/common/Containerfile.rag
28-
- name: parent-image
29-
value: quay.io/redhat-user-workloads/ramalama-tenant/cuda:{{revision}}
3028
- name: build-args
3129
value:
32-
- PARENT=quay.io/redhat-user-workloads/ramalama-tenant/cuda:{{revision}}
33-
- GPU=cuda
30+
- PARENT=docker.io/nvidia/cuda:12.8.1-devel-ubi9
31+
- TORCH_BACKEND=cu128
3432
pipelineRef:
3533
name: push-pipeline
3634
timeouts:

.tekton/integration/pipelines/bats-integration.yaml

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -70,9 +70,12 @@ spec:
7070
- name: envs
7171
value:
7272
- RAMALAMA_DEFAULT_IMAGE="$(tasks.init.results.ramalama-image)"
73+
- RAMALAMA_DEFAULT_RAG_IMAGE="$(tasks.init.results.ramalama-rag-image)"
7374
- RAMALAMA_STACK_IMAGE=$(tasks.init.results.stack-image)
7475
- >-
7576
RAMALAMA_IMAGES='{"CUDA_VISIBLE_DEVICES": "$(tasks.init.results.cuda-image)"}'
77+
- >-
78+
RAMALAMA_RAG_IMAGES='{"CUDA_VISIBLE_DEVICES": "$(tasks.init.results.cuda-rag-image)"}'
7679
taskRef:
7780
resolver: git
7881
params:

.tekton/integration/tasks/init-snapshot.yaml

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -23,10 +23,14 @@ spec:
2323
description: URI of the bats image included in the snapshot
2424
- name: ramalama-image
2525
description: URI of the ramalama image included in the snapshot
26+
- name: ramalama-rag-image
27+
description: URI of the ramalama-rag image included in the snapshot
2628
- name: stack-image
2729
description: URI of the llama-stack image included in the snapshot
2830
- name: cuda-image
2931
description: URI of the cuda image included in the snapshot
32+
- name: cuda-rag-image
33+
description: URI of the cuda-rag image included in the snapshot
3034
- name: TEST_OUTPUT
3135
description: Test result in json format
3236
steps:
@@ -59,10 +63,14 @@ spec:
5963
value: $(results.bats-image.path)
6064
- name: RESULTS_RAMALAMA_IMAGE_PATH
6165
value: $(results.ramalama-image.path)
66+
- name: RESULTS_RAMALAMA_RAG_IMAGE_PATH
67+
value: $(results.ramalama-rag-image.path)
6268
- name: RESULTS_STACK_IMAGE_PATH
6369
value: $(results.stack-image.path)
6470
- name: RESULTS_CUDA_IMAGE_PATH
6571
value: $(results.cuda-image.path)
72+
- name: RESULTS_CUDA_RAG_IMAGE_PATH
73+
value: $(results.cuda-rag-image.path)
6674
- name: RESULTS_TEST_OUTPUT_PATH
6775
value: $(results.TEST_OUTPUT.path)
6876
script: |
@@ -87,9 +95,13 @@ spec:
8795
echo
8896
component_image ramalama | tee "$RESULTS_RAMALAMA_IMAGE_PATH"
8997
echo
98+
component_image ramalama-rag | tee "$RESULTS_RAMALAMA_RAG_IMAGE_PATH"
99+
echo
90100
component_image llama-stack | tee "$RESULTS_STACK_IMAGE_PATH"
91101
echo
92102
component_image cuda | tee "$RESULTS_CUDA_IMAGE_PATH"
93103
echo
104+
component_image cuda-rag | tee "$RESULTS_CUDA_RAG_IMAGE_PATH"
105+
echo
94106
jq -jnc '{result: "SUCCESS", timestamp: now | todateiso8601, failures: 0, successes: 1, warnings: 0}' | tee "$RESULTS_TEST_OUTPUT_PATH"
95107
echo

.tekton/intel-gpu-rag/intel-gpu-rag-pull-request.yaml

Lines changed: 1 addition & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -31,12 +31,9 @@ spec:
3131
- linux-d160-c8xlarge/amd64
3232
- name: dockerfile
3333
value: container-images/common/Containerfile.rag
34-
- name: parent-image
35-
value: quay.io/redhat-user-workloads/ramalama-tenant/intel-gpu:on-pr-{{revision}}
3634
- name: build-args
3735
value:
38-
- PARENT=quay.io/redhat-user-workloads/ramalama-tenant/intel-gpu:on-pr-{{revision}}
39-
- GPU=cpu
36+
- TORCH_BACKEND=xpu
4037
pipelineRef:
4138
name: pull-request-pipeline
4239
timeouts:

.tekton/intel-gpu-rag/intel-gpu-rag-push.yaml

Lines changed: 1 addition & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -28,12 +28,9 @@ spec:
2828
- linux-d160-c8xlarge/amd64
2929
- name: dockerfile
3030
value: container-images/common/Containerfile.rag
31-
- name: parent-image
32-
value: quay.io/redhat-user-workloads/ramalama-tenant/intel-gpu:{{revision}}
3331
- name: build-args
3432
value:
35-
- PARENT=quay.io/redhat-user-workloads/ramalama-tenant/intel-gpu:{{revision}}
36-
- GPU=cpu
33+
- TORCH_BACKEND=xpu
3734
pipelineRef:
3835
name: push-pipeline
3936
timeouts:

0 commit comments

Comments
 (0)