Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
34 commits
Select commit Hold shift + click to select a range
9950f6f
Initial version of MinIO event based dataprep for Milvus
dilverse Oct 28, 2024
7d76da5
Merge branch 'opea-project:main' into main
dilverse Oct 28, 2024
a299782
Initial version of MinIO event based dataprep for Milvus
dilverse Nov 1, 2024
2d1a561
Update to latest MinIO Image
dilverse Nov 2, 2024
92e99c6
Add LanceDB and MinIO event based dataprep support
dilverse Nov 2, 2024
d6a5a7e
Add MinIO utils file that parses event notifications from MinIO
dilverse Nov 2, 2024
e497710
Merge branch 'opea-project:main' into main
dilverse Nov 2, 2024
2b13f5d
Update README.md files
dilverse Nov 3, 2024
78064a8
Add MinIO LanceDB retriever support
dilverse Nov 3, 2024
eb8897d
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Nov 3, 2024
616dc63
Fix README.md paths
dilverse Nov 3, 2024
c05bdcb
Fix README.md for Milvus to right path
dilverse Nov 3, 2024
a65d3dc
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Nov 3, 2024
80fe8f6
Fix connection arguments for Milvus
dilverse Nov 3, 2024
33d38f4
Remove local file volumes from docker compose
dilverse Nov 3, 2024
e83f649
Merge branch 'main' into main
mkbhanda Nov 5, 2024
c4dfea3
Update comps/dataprep/minio/lancedb/langchain/README.md
dilverse Nov 6, 2024
263aac3
Update comps/dataprep/minio/lancedb/langchain/README.md
dilverse Nov 6, 2024
5238a85
Update comps/dataprep/minio/lancedb/langchain/README.md
dilverse Nov 6, 2024
d6142a8
Update comps/dataprep/minio/lancedb/langchain/README.md
dilverse Nov 6, 2024
b66221e
Update comps/dataprep/minio/milvus/langchain/README.md
dilverse Nov 6, 2024
491cdcd
Update comps/dataprep/minio/milvus/langchain/README.md
dilverse Nov 6, 2024
94581a7
Update comps/dataprep/minio/milvus/langchain/README.md
dilverse Nov 6, 2024
535d09a
Update comps/dataprep/minio/milvus/langchain/README.md
dilverse Nov 6, 2024
e726c57
Update comps/dataprep/minio/milvus/langchain/README.md
dilverse Nov 6, 2024
fefd9ec
Update comps/dataprep/minio/milvus/langchain/README.md
dilverse Nov 6, 2024
1efea4d
Remove unused code and add appropriate copyrights and minor lint fixes
dilverse Nov 6, 2024
2952611
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Nov 6, 2024
30976f1
Merge branch 'main' into main
dilverse Nov 6, 2024
7c41fc5
Merge branch 'main' into main
lvliang-intel Nov 12, 2024
ce2c768
Merge branch 'main' into main
dilverse Dec 27, 2024
ac5413f
Added new docker files to github workflow
dilverse Dec 27, 2024
fba854a
Add new lines to the workflows
dilverse Dec 27, 2024
d526d28
Remove trailing spaces
dilverse Dec 27, 2024
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
120 changes: 64 additions & 56 deletions .github/workflows/docker/compose/dataprep-compose.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -3,59 +3,67 @@

# this file should be run in the root of the repo
# Image build definitions for the dataprep components.
# Each entry maps a service name to the Dockerfile it is built from and the
# image reference it is tagged with. REGISTRY defaults to "opea" and TAG
# defaults to "latest" when the variables are not set.
# Every service is listed exactly once: duplicate mapping keys are invalid
# YAML and most parsers silently keep only the last occurrence.
services:
  dataprep-redis:
    build:
      dockerfile: comps/dataprep/redis/langchain/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-redis:${TAG:-latest}
  dataprep-qdrant:
    build:
      dockerfile: comps/dataprep/qdrant/langchain/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-qdrant:${TAG:-latest}
  dataprep-on-ray-redis:
    build:
      dockerfile: comps/dataprep/redis/langchain_ray/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-on-ray-redis:${TAG:-latest}
  dataprep-multimodal-vdms:
    build:
      dockerfile: comps/dataprep/vdms/multimodal_langchain/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-multimodal-vdms:${TAG:-latest}
  dataprep-multimodal-redis:
    build:
      dockerfile: comps/dataprep/multimodal/redis/langchain/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-multimodal-redis:${TAG:-latest}
  dataprep-redis-llama-index:
    build:
      dockerfile: comps/dataprep/redis/llama_index/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-redis-llama-index:${TAG:-latest}
  dataprep-milvus:
    build:
      dockerfile: comps/dataprep/milvus/langchain/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-milvus:${TAG:-latest}
  dataprep-pgvector:
    build:
      dockerfile: comps/dataprep/pgvector/langchain/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-pgvector:${TAG:-latest}
  dataprep-pinecone:
    build:
      dockerfile: comps/dataprep/pinecone/langchain/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-pinecone:${TAG:-latest}
  dataprep-vdms:
    build:
      dockerfile: comps/dataprep/vdms/langchain/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-vdms:${TAG:-latest}
  dataprep-neo4j:
    build:
      dockerfile: comps/dataprep/neo4j/langchain/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-neo4j:${TAG:-latest}
  dataprep-neo4j-llamaindex:
    build:
      dockerfile: comps/dataprep/neo4j/llama_index/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-neo4j-llamaindex:${TAG:-latest}
  dataprep-elasticsearch:
    build:
      dockerfile: comps/dataprep/elasticsearch/langchain/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-elasticsearch:${TAG:-latest}
  dataprep-opensearch:
    build:
      dockerfile: comps/dataprep/opensearch/langchain/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-opensearch:${TAG:-latest}
  # MinIO event-driven dataprep variants.
  dataprep-minio-lancedb:
    build:
      dockerfile: comps/dataprep/minio/lancedb/langchain/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-minio-lancedb:${TAG:-latest}
  dataprep-minio-milvus:
    build:
      dockerfile: comps/dataprep/minio/milvus/langchain/Dockerfile
    image: ${REGISTRY:-opea}/dataprep-minio-milvus:${TAG:-latest}
4 changes: 4 additions & 0 deletions .github/workflows/docker/compose/retrievers-compose.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -51,3 +51,7 @@ services:
build:
dockerfile: comps/retrievers/opensearch/langchain/Dockerfile
image: ${REGISTRY:-opea}/retriever-opensearch:${TAG:-latest}
# Retriever image backed by MinIO + LanceDB. `dockerfile` belongs to the
# `build` mapping, and `build`/`image` belong to the service entry.
# NOTE(review): this entry is a child of the file's `services:` mapping, whose
# header is outside this fragment; indent the whole entry to match its siblings.
retriever-minio-lancedb:
  build:
    dockerfile: comps/retrievers/minio/lancedb/langchain/Dockerfile
  image: ${REGISTRY:-opea}/retriever-minio-lancedb:${TAG:-latest}
2 changes: 2 additions & 0 deletions comps/dataprep/minio/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
# Copyright (c) 2015-2024 MinIO, Inc.
# SPDX-License-Identifier: Apache-2.0
38 changes: 38 additions & 0 deletions comps/dataprep/minio/lancedb/langchain/Dockerfile
Original file line number Diff line number Diff line change
@@ -0,0 +1,38 @@
# Copyright (c) 2015-2024 MinIO, Inc.
# SPDX-License-Identifier: Apache-2.0

# Image for the MinIO + LanceDB dataprep service; the container runs
# prepare_doc_lancedb.py from the component directory as the non-root "user".
FROM python:3.11-slim

ENV LANG=C.UTF-8

# Build-time switch: with the default "cpu", CPU-only PyTorch wheels are
# installed from the PyTorch CPU index before the component requirements.
ARG ARCH="cpu"

# System packages needed by the Python requirements.
# - libgl1 replaces libgl1-mesa-glx, a transitional package that newer Debian
#   releases (and therefore newer python:*-slim bases) no longer provide.
# - The apt package lists are removed in the same layer to keep the image small.
RUN apt-get update -y && apt-get install -y --no-install-recommends --fix-missing \
    build-essential \
    default-jre \
    libgl1 \
    libjemalloc-dev \
    tesseract-ocr && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*

# Unprivileged account that owns the home directory and runs the service.
RUN useradd -m -s /bin/bash user && \
    mkdir -p /home/user && \
    chown -R user /home/user/

USER user

COPY comps /home/user/comps

# "${ARCH}" is quoted so an empty or space-containing build arg cannot break
# the shell test expression.
RUN pip install --no-cache-dir --upgrade pip setuptools && \
    if [ "${ARCH}" = "cpu" ]; then pip install --no-cache-dir torch torchvision --index-url https://download.pytorch.org/whl/cpu; fi && \
    pip install --no-cache-dir -r /home/user/comps/dataprep/minio/lancedb/langchain/requirements.txt

# Makes the copied "comps" package importable from /home/user.
ENV PYTHONPATH=$PYTHONPATH:/home/user

# The upload directory is created as root and then handed over to "user".
USER root

RUN mkdir -p /home/user/comps/dataprep/minio/lancedb/langchain/uploaded_files && chown -R user /home/user/comps/dataprep/minio/lancedb/langchain/uploaded_files

USER user
WORKDIR /home/user/comps/dataprep/minio/lancedb/langchain

ENTRYPOINT ["python", "prepare_doc_lancedb.py"]
Loading
Loading