
Commit 2e41dcf

Support Llama index for vLLM native (#692)
Signed-off-by: zhenwei-intel <[email protected]>
1 parent 391c4a5 commit 2e41dcf

17 files changed (+1032, −6 lines)

.github/workflows/docker/compose/llms-compose-cd.yaml

Lines changed: 5 additions & 1 deletion
@@ -4,8 +4,12 @@
 services:
   llm-native:
     build:
-      dockerfile: comps/llms/text-generation/native/Dockerfile
+      dockerfile: comps/llms/text-generation/native/langchain/Dockerfile
     image: ${REGISTRY:-opea}/llm-native:${TAG:-latest}
+  llm-native-llamaindex:
+    build:
+      dockerfile: comps/llms/text-generation/native/llama_index/Dockerfile
+    image: ${REGISTRY:-opea}/llm-native-llamaindex:${TAG:-latest}
   vllm-openvino:
     build:
       context: vllm-openvino
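For local verification, the same compose file can drive the image builds that CI performs. A minimal sketch, assuming it is run from the repository root and that the default `REGISTRY`/`TAG` values above are acceptable:

```bash
# Build only the two native LLM images declared above; other services in the
# compose file are left alone. REGISTRY and TAG fall back to "opea" / "latest".
docker compose -f .github/workflows/docker/compose/llms-compose-cd.yaml \
  build llm-native llm-native-llamaindex
```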
comps/llms/text-generation/native/langchain/Dockerfile

Lines changed: 41 additions & 0 deletions
@@ -0,0 +1,41 @@
+# Copyright (C) 2024 Intel Corporation
+# SPDX-License-Identifier: Apache-2.0
+
+# HABANA environment
+# FROM vault.habana.ai/gaudi-docker/1.16.1/ubuntu22.04/habanalabs/pytorch-installer-2.2.2:latest as hpu
+FROM opea/habanalabs:1.16.1-pytorch-installer-2.2.2 as hpu
+
+ENV LANG=en_US.UTF-8
+ARG REPO=https://github.com/huggingface/optimum-habana.git
+ARG REPO_VER=v1.12.1
+
+RUN apt-get update && apt-get install -y --no-install-recommends --fix-missing \
+    git-lfs \
+    libgl1-mesa-glx \
+    libjemalloc-dev
+
+RUN useradd -m -s /bin/bash user && \
+    mkdir -p /home/user && \
+    chown -R user /home/user/
+
+USER user
+
+RUN git lfs install
+
+COPY comps /home/user/comps
+
+RUN pip install --no-cache-dir --upgrade-strategy eager optimum[habana] && \
+    pip install --no-cache-dir git+https://github.com/HabanaAI/[email protected]
+
+RUN git clone ${REPO} /home/user/optimum-habana && \
+    cd /home/user/optimum-habana && git checkout ${REPO_VER} && \
+    cd examples/text-generation && pip install --no-cache-dir -r requirements.txt && \
+    cd /home/user/comps/llms/text-generation/native/langchain && \
+    pip install --no-cache-dir -r requirements.txt && \
+    pip install --no-cache-dir --upgrade --force-reinstall pydantic
+
+ENV PYTHONPATH=/root:/home/user
+
+WORKDIR /home/user/comps/llms/text-generation/native/langchain
+
+ENTRYPOINT ["python", "llm.py"]
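A container built from this Dockerfile launches `llm.py` directly through the `ENTRYPOINT`. A minimal run sketch for a Gaudi host, mirroring the flags used in the llama_index README further down (image tag, port, and model name are illustrative, not prescriptive):

```bash
# Run the langchain-based native LLM service on Habana hardware.
# The image tag matches the build command in the README change below.
docker run -d --runtime=habana --name="llm-native-server" -p 9000:9000 \
  -e https_proxy=$https_proxy -e http_proxy=$http_proxy \
  -e TOKENIZERS_PARALLELISM=false -e HABANA_VISIBLE_DEVICES=all \
  -e OMPI_MCA_btl_vader_single_copy_mechanism=none \
  -e LLM_NATIVE_MODEL="Qwen/Qwen2-7B-Instruct" \
  --cap-add=sys_nice --ipc=host opea/llm-native:latest
```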

comps/llms/text-generation/native/README.md renamed to comps/llms/text-generation/native/langchain/README.md

Lines changed: 3 additions & 2 deletions
@@ -17,8 +17,9 @@ export LLM_NATIVE_MODEL="Qwen/Qwen2-7B-Instruct"
 ### 1.2 Build Docker Image
 
 ```bash
-cd ../../../../
-docker build -t opea/llm-native:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/llms/text-generation/native/Dockerfile .
+cd ../../../../../
+docker build -t opea/llm-native:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/llms/text-generation/native/langchain/Dockerfile .
 ```
 
 To start a docker container, you have two options:

comps/llms/text-generation/native/Dockerfile renamed to comps/llms/text-generation/native/llama_index/Dockerfile

Lines changed: 2 additions & 2 deletions
@@ -30,11 +30,11 @@ RUN pip install --no-cache-dir --upgrade-strategy eager optimum[habana] && \
 RUN git clone ${REPO} /home/user/optimum-habana && \
     cd /home/user/optimum-habana && git checkout ${REPO_VER} && \
     cd examples/text-generation && pip install --no-cache-dir -r requirements.txt && \
-    cd /home/user/comps/llms/text-generation/native && pip install --no-cache-dir -r requirements.txt && \
+    cd /home/user/comps/llms/text-generation/native/llama_index && pip install --no-cache-dir -r requirements.txt && \
     pip install --no-cache-dir --upgrade --force-reinstall pydantic
 
 ENV PYTHONPATH=/root:/home/user
 
-WORKDIR /home/user/comps/llms/text-generation/native
+WORKDIR /home/user/comps/llms/text-generation/native/llama_index
 
 ENTRYPOINT ["python", "llm.py"]
comps/llms/text-generation/native/llama_index/README.md

Lines changed: 60 additions & 0 deletions
@@ -0,0 +1,60 @@
+# LLM Native Microservice
+
+The LLM Native microservice uses [optimum-habana](https://github.com/huggingface/optimum-habana) for model initialization and warm-up, focusing solely on large language models (LLMs). It operates without serving frameworks such as TGI or vLLM, using PyTorch directly for inference, and supports only non-streaming responses. This streamlined approach optimizes performance on Habana hardware.
+
+## 🚀1. Start Microservice
+
+If you start the LLM microservice with Docker, the `docker_compose_llm.yaml` file will automatically start the Native LLM service in a container.
+
+### 1.1 Setup Environment Variables
+
+To start the Native LLM service, you first need to set the following environment variable.
+
+```bash
+export LLM_NATIVE_MODEL="Qwen/Qwen2-7B-Instruct"
+```
+
+### 1.2 Build Docker Image
+
+```bash
+cd ../../../../../
+docker build -t opea/llm-native:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/llms/text-generation/native/llama_index/Dockerfile .
+```
+
+To start a Docker container, you have two options:
+
+- A. Run Docker with CLI
+- B. Run Docker with Docker Compose
+
+You can choose one as needed.
+
+### 1.3 Run Docker with CLI (Option A)
+
+```bash
+docker run -d --runtime=habana --name="llm-native-server" -p 9000:9000 -e https_proxy=$https_proxy -e http_proxy=$http_proxy -e TOKENIZERS_PARALLELISM=false -e HABANA_VISIBLE_DEVICES=all -e OMPI_MCA_btl_vader_single_copy_mechanism=none --cap-add=sys_nice --ipc=host -e LLM_NATIVE_MODEL=${LLM_NATIVE_MODEL} opea/llm-native:latest
+```
+
+### 1.4 Run Docker with Docker Compose (Option B)
+
+```bash
+docker compose -f docker_compose_llm.yaml up -d
+```
+
+## 🚀2. Consume LLM Service
+
+### 2.1 Check Service Status
+
+```bash
+curl http://${your_ip}:9000/v1/health_check \
+  -X GET \
+  -H 'Content-Type: application/json'
+```
+
+### 2.2 Consume LLM Service
+
+```bash
+curl http://${your_ip}:9000/v1/chat/completions \
+  -X POST \
+  -d '{"query":"What is Deep Learning?"}' \
+  -H 'Content-Type: application/json'
+```
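The README above tags the image as `opea/llm-native:latest`, while the CD compose entry added in this commit expects `opea/llm-native-llamaindex:${TAG:-latest}`. A minimal sketch of building the llama_index variant under the compose-style name instead, assuming the command is run from the repository root:

```bash
# Build the llama_index variant with the image name used by the CD compose file.
docker build -t opea/llm-native-llamaindex:latest \
  --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy \
  -f comps/llms/text-generation/native/llama_index/Dockerfile .
```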
