
Create Haystack and Langchain Nodes #1420

Open
wants to merge 25 commits into base: branch-24.06

25 commits
8d2ca24
Added haystack llm orch to agents pipeline
bsuryadevara Dec 11, 2023
81a0e7f
Trivial changes
bsuryadevara Dec 11, 2023
a7ab077
Trivial changes
bsuryadevara Dec 11, 2023
96d3887
Updated haystack calculator node
bsuryadevara Dec 11, 2023
6247ea3
Updated haystack calculator node
bsuryadevara Dec 11, 2023
5034a90
Added haystack llm agent
bsuryadevara Dec 11, 2023
59f0056
Merge branch 'branch-24.03' into create-haystack-node
bsuryadevara Dec 11, 2023
1820796
Added tests to haystack agent node
bsuryadevara Dec 12, 2023
e28caf5
Merge branch 'create-haystack-node' of github.com:bsuryadevara/Morphe…
bsuryadevara Dec 12, 2023
dbc03dc
Updated agents kafka pipeline
bsuryadevara Dec 13, 2023
28e24db
Merge remote-tracking branch 'upstream/branch-24.03' into create-hays…
bsuryadevara Dec 13, 2023
ef223e8
Removed haystack full package installation
bsuryadevara Dec 13, 2023
c17dbef
Removed haystack full package installation
bsuryadevara Dec 13, 2023
01ff40b
Removed haystack dependency from dev yaml
bsuryadevara Dec 13, 2023
067b15e
Merge branch 'branch-24.03' into create-haystack-node
bsuryadevara Dec 18, 2023
40178f8
Added llamaindex agent functionality
bsuryadevara Dec 20, 2023
38bb8fa
Merge branch 'branch-24.03' into create-haystack-node
bsuryadevara Dec 20, 2023
ea57b44
Updated openai chat service tests
bsuryadevara Dec 26, 2023
47abbbb
Updated openai client tests
bsuryadevara Jan 2, 2024
a95e22c
Merge branch 'branch-24.03' into create-haystack-node
bsuryadevara Jan 2, 2024
4dfd04a
Updated copyright header
bsuryadevara Jan 3, 2024
f9ad5fa
Merge branch 'create-haystack-node' of github.com:bsuryadevara/Morphe…
bsuryadevara Jan 3, 2024
e3af515
Updated copyright header
bsuryadevara Jan 3, 2024
211d66f
Fixed flake8 errors with openai module
bsuryadevara Jan 3, 2024
363e2b9
Fixed flake8 errors with openai module
bsuryadevara Jan 3, 2024
8 changes: 5 additions & 3 deletions docker/conda/environments/cuda11.8_examples.yml
@@ -1,4 +1,4 @@
# SPDX-FileCopyrightText: Copyright (c) 2022-2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-FileCopyrightText: Copyright (c) 2022-2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the "License");
@@ -36,11 +36,10 @@ dependencies:
- dill=0.3.6
- distributed>=2023.1.1
- huggingface_hub=0.10.1 # work-around for https://github.com/UKPLab/sentence-transformers/issues/1762
- langchain=0.0.190
- libwebp>=1.3.2 # Required for CVE mitigation: https://nvd.nist.gov/vuln/detail/CVE-2023-4863
- mlflow>=2.2.1,<3
- newspaper3k=0.2
- openai=0.28
- numexpr=2.8.7
- papermill=2.3.4
- pypdf=3.16
- requests-cache=1.1
@@ -59,6 +58,9 @@ dependencies:

####### Pip Dependencies (keep sorted!) #######
- pip:
- farm-haystack==1.22.1
- google-search-results==2.4
- grpcio-status==1.58 # To keep in sync with 1.58 grpcio which is installed for Morpheus
- langchain==0.0.351
- llama-index==0.9.16.post1
- nemollm
3 changes: 3 additions & 0 deletions examples/data/vector_store/sample_document.txt
Git LFS file not shown
30 changes: 26 additions & 4 deletions examples/llm/agents/README.md
@@ -1,5 +1,5 @@
<!--
SPDX-FileCopyrightText: Copyright (c) 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
SPDX-FileCopyrightText: Copyright (c) 2023-2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
SPDX-License-Identifier: Apache-2.0

Licensed under the Apache License, Version 2.0 (the "License");
@@ -51,7 +51,7 @@ The pipeline supports different agent types, each influencing the pattern for in
Depending on the problem at hand, various tools can be provided to LLM agents, such as internet searches, VDB retrievers, calculators, Wikipedia, etc. In this example, we'll use the internet search tool and an llm-math tool, allowing the LLM agent to perform Google searches and solve math equations.

### LLM Library
The pipeline utilizes the Langchain library to run LLM agents, enabling their execution directly within a Morpheus pipeline. This approach reduces the overhead of migrating existing systems to Morpheus and eliminates the need to replicate work done by popular LLM libraries like llama-index and Haystack.
The pipeline utilizes the LangChain and Haystack libraries to run LLM agents, enabling their execution directly within a Morpheus pipeline. This approach reduces the overhead of migrating existing systems to Morpheus and eliminates the need to replicate work done by popular LLM libraries such as LangChain, Haystack, and llama-index.

## Pipeline Implementation
- **InMemorySourceStage**: Manages LLM queries in a DataFrame.
@@ -90,6 +90,17 @@ SerpApi API key. Set the API key as an environment variable using the following
export SERPAPI_API_KEY="<YOUR_SERPAPI_API_KEY>"
```

**Serper Dev API Key**

Go to [SerperDev](https://serper.dev/login) to register and create an account. Once registered, obtain your
Serper Dev API key. Set the API key as an environment variable using the following command:

```bash
export SERPERDEV_API_KEY="<YOUR_SERPERDEV_API_KEY>"
```

Note: This is required when using the Haystack LLM orchestration framework in the pipeline.
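
To make the setup explicit, here is a minimal helper sketching these environment checks. The key names come from this README; the assumption (stated in the note above) is that `SERPAPI_API_KEY` is always needed for the search tool while `SERPERDEV_API_KEY` is only needed on the Haystack path:

```python
import os


def missing_search_keys(llm_orch: str, env=None) -> list:
    """Return the search-API key names that are not set for the chosen
    orchestrator. SERPAPI_API_KEY backs the internet-search tool; per the
    note above, SERPERDEV_API_KEY is only required for Haystack."""
    env = os.environ if env is None else env
    required = ["SERPAPI_API_KEY"]
    if llm_orch == "haystack":
        required.append("SERPERDEV_API_KEY")
    return [name for name in required if not env.get(name)]
```

For example, `missing_search_keys("haystack")` run before launching the pipeline would report any keys still unset.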

#### Install Dependencies

Install the required dependencies.
@@ -120,7 +131,7 @@ This example demonstrates the basic implementation of Morpheus pipeline, showcas


```bash
python exmaples/llm/main.py agents simple [OPTIONS]
python examples/llm/main.py agents simple [OPTIONS]
```

### Options:
@@ -144,6 +155,12 @@ python exmaples/llm/main.py agents simple [OPTIONS]
- `--repeat_count INTEGER RANGE`
- **Description**: Number of times to repeat the input query. Useful for testing performance.
- **Default**: `1`

- `--llm_orch TEXT`
- **Choice**: `[haystack|langchain|llama_index]`
- **Description**: The LLM orchestration framework to use in the pipeline.
- **Default**: `langchain`

- `--help`
- **Description**: Show the help message with options and commands details.

@@ -172,7 +189,7 @@ kafka-topics.sh --bootstrap-server ${BOOTSTRAP_SERVER} --alter --topic input --p
Now Kafka example can be run using the following command with the below listed options:

```bash
python exmaples/llm/main.py agents kafka [OPTIONS]
python examples/llm/main.py agents kafka [OPTIONS]
```

### Options:
@@ -193,6 +210,11 @@ python exmaples/llm/main.py agents kafka [OPTIONS]
- **Description**: The name of the model to use in OpenAI.
- **Default**: `gpt-3.5-turbo-instruct`

- `--llm_orch TEXT`
- **Choice**: `[haystack|langchain]`
- **Description**: The LLM orchestration framework to use in the pipeline.
- **Default**: `langchain`

- `--help`
- **Description**: Show the help message with options and commands details.

46 changes: 7 additions & 39 deletions examples/llm/agents/kafka_pipeline.py
@@ -1,4 +1,4 @@
# Copyright (c) 2023, NVIDIA CORPORATION.
# Copyright (c) 2023-2024, NVIDIA CORPORATION.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
@@ -15,55 +15,22 @@
import logging
import time

from langchain.agents import AgentType
from langchain.agents import initialize_agent
from langchain.agents import load_tools
from langchain.agents.agent import AgentExecutor
from langchain.llms.openai import OpenAIChat

from morpheus.config import Config
from morpheus.config import PipelineModes
from morpheus.llm import LLMEngine
from morpheus.llm.nodes.extracter_node import ExtracterNode
from morpheus.llm.nodes.langchain_agent_node import LangChainAgentNode
from morpheus.llm.task_handlers.simple_task_handler import SimpleTaskHandler
from morpheus.messages import ControlMessage
from morpheus.pipeline.linear_pipeline import LinearPipeline
from morpheus.stages.input.kafka_source_stage import KafkaSourceStage
from morpheus.stages.llm.llm_engine_stage import LLMEngineStage
from morpheus.stages.output.in_memory_sink_stage import InMemorySinkStage
from morpheus.stages.preprocess.deserialize_stage import DeserializeStage

logger = logging.getLogger(__name__)


def _build_agent_executor(model_name: str) -> AgentExecutor:

llm = OpenAIChat(model=model_name, temperature=0)

tools = load_tools(["serpapi", "llm-math"], llm=llm)

agent_executor = initialize_agent(tools, llm, agent=AgentType.ZERO_SHOT_REACT_DESCRIPTION, verbose=True)

return agent_executor
from ..common.engine_builder import build_engine_with_agent_node


def _build_engine(model_name: str) -> LLMEngine:

engine = LLMEngine()

engine.add_node("extracter", node=ExtracterNode())

engine.add_node("agent",
inputs=[("/extracter")],
node=LangChainAgentNode(agent_executor=_build_agent_executor(model_name=model_name)))

engine.add_task_handler(inputs=["/extracter"], handler=SimpleTaskHandler())

return engine
logger = logging.getLogger(__name__)


def pipeline(num_threads: int, pipeline_batch_size: int, model_max_batch_size: int, model_name: str) -> float:
def pipeline(num_threads: int, pipeline_batch_size: int, model_max_batch_size: int, model_name: str,
llm_orch: str) -> float:
config = Config()
config.mode = PipelineModes.OTHER

@@ -85,7 +52,8 @@ def pipeline(num_threads: int, pipeline_batch_size: int, model_max_batch_size: i

# pipe.add_stage(MonitorStage(config, description="Source rate", unit='questions'))

pipe.add_stage(LLMEngineStage(config, engine=_build_engine(model_name=model_name)))
pipe.add_stage(LLMEngineStage(config, engine=build_engine_with_agent_node(model_name=model_name,
llm_orch=llm_orch)))

sink = pipe.add_stage(InMemorySinkStage(config))

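Both pipelines now import `build_engine_with_agent_node` from a shared `examples/llm/common/engine_builder` module whose body is not shown in this diff. A plausible shape is a simple dispatch on `llm_orch`; the sketch below is hypothetical, with placeholder builders standing in for the real Morpheus `LLMEngine` wiring of the LangChain/Haystack/llama-index agent nodes:

```python
# Hypothetical sketch only: the real helper would return a Morpheus
# LLMEngine wired with the framework-specific agent node. Plain strings
# stand in for those engine objects here to illustrate the dispatch.

def _build_langchain_engine(model_name: str) -> str:
    return f"langchain:{model_name}"


def _build_haystack_engine(model_name: str) -> str:
    return f"haystack:{model_name}"


def _build_llama_index_engine(model_name: str) -> str:
    return f"llama_index:{model_name}"


_BUILDERS = {
    "langchain": _build_langchain_engine,
    "haystack": _build_haystack_engine,
    "llama_index": _build_llama_index_engine,
}


def build_engine_with_agent_node(model_name: str, llm_orch: str):
    """Dispatch to the builder for the requested orchestration framework."""
    try:
        builder = _BUILDERS[llm_orch.lower()]
    except KeyError as exc:
        raise ValueError(f"Unsupported llm_orch: {llm_orch!r}") from exc
    return builder(model_name)
```

A table-driven dispatch like this keeps the pipeline files free of per-framework imports, which matches how both `kafka_pipeline.py` and `simple_pipeline.py` shrink in this diff.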
7 changes: 5 additions & 2 deletions examples/llm/agents/requirements.yaml
@@ -1,4 +1,4 @@
# SPDX-FileCopyrightText: Copyright (c) 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-FileCopyrightText: Copyright (c) 2023-2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the "License");
@@ -18,7 +18,7 @@ channels:
- conda-forge
- defaults
dependencies:
- langchain=0.0.190
- numexpr=2.8.7
- pip
- requests-cache=1.1
- sentence-transformers
@@ -31,5 +31,8 @@

####### Pip Dependencies (keep sorted!) #######
- pip:
- farm-haystack==1.22.1
- grpcio-status==1.58 # To keep in sync with 1.58 grpcio which is installed for Morpheus
- langchain==0.0.351
- llama-index==0.9.16.post1
- nemollm
14 changes: 13 additions & 1 deletion examples/llm/agents/run.py
@@ -1,4 +1,4 @@
# Copyright (c) 2023, NVIDIA CORPORATION.
# Copyright (c) 2023-2024, NVIDIA CORPORATION.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
@@ -57,6 +57,12 @@ def run():
type=click.IntRange(min=1),
help="Number of times to repeat the input query. Useful for testing performance.",
)
@click.option(
"--llm_orch",
default="langchain",
type=click.Choice(["haystack", "langchain", "llama_index"], case_sensitive=False),
help="The LLM orchestration framework to use in the pipeline.",
)
def simple(**kwargs):

from .simple_pipeline import pipeline as _pipeline
@@ -91,6 +97,12 @@ def simple(**kwargs):
default='gpt-3.5-turbo-instruct',
help="The name of the model to use in OpenAI",
)
@click.option(
"--llm_orch",
default="langchain",
type=click.Choice(["haystack", "langchain"], case_sensitive=False),
help="The LLM orchestration framework to use in the pipeline.",
)
def kafka(**kwargs):

from .kafka_pipeline import pipeline as _pipeline
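The new `--llm_orch` options use `click.Choice(..., case_sensitive=False)`, so `--llm_orch HayStack` resolves to the canonical `haystack` entry. A standalone sketch of that normalization (not click's actual implementation) shows why the canonical, lowercase spelling is what reaches the pipeline:

```python
def normalize_choice(value: str, choices) -> str:
    """Match value against choices ignoring case; return the canonical
    spelling from the choices list, as click does for case-insensitive
    Choice parameters."""
    for choice in choices:
        if value.lower() == choice.lower():
            return choice
    raise ValueError(f"{value!r} is not one of {list(choices)!r}")


# The choices offered by the `simple` command in this diff.
ORCHESTRATORS = ("haystack", "langchain", "llama_index")
```

For example, `normalize_choice("HayStack", ORCHESTRATORS)` yields `"haystack"`, so downstream code can compare against the lowercase names only.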
64 changes: 17 additions & 47 deletions examples/llm/agents/simple_pipeline.py
@@ -1,4 +1,4 @@
# Copyright (c) 2023, NVIDIA CORPORATION.
# Copyright (c) 2023-2024, NVIDIA CORPORATION.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
@@ -15,20 +15,10 @@
import logging
import time

from langchain import OpenAI
from langchain.agents import AgentType
from langchain.agents import initialize_agent
from langchain.agents import load_tools
from langchain.agents.agent import AgentExecutor

import cudf

from morpheus.config import Config
from morpheus.config import PipelineModes
from morpheus.llm import LLMEngine
from morpheus.llm.nodes.extracter_node import ExtracterNode
from morpheus.llm.nodes.langchain_agent_node import LangChainAgentNode
from morpheus.llm.task_handlers.simple_task_handler import SimpleTaskHandler
from morpheus.messages import ControlMessage
from morpheus.pipeline.linear_pipeline import LinearPipeline
from morpheus.stages.general.monitor_stage import MonitorStage
@@ -38,42 +28,17 @@
from morpheus.stages.preprocess.deserialize_stage import DeserializeStage
from morpheus.utils.concat_df import concat_dataframes

logger = logging.getLogger(__name__)


def _build_agent_executor(model_name: str) -> AgentExecutor:

llm = OpenAI(model=model_name, temperature=0)

tools = load_tools(["serpapi", "llm-math"], llm=llm)

agent_executor = initialize_agent(tools, llm, agent=AgentType.ZERO_SHOT_REACT_DESCRIPTION, verbose=True)

return agent_executor
from ..common.engine_builder import build_engine_with_agent_node


def _build_engine(model_name: str) -> LLMEngine:

engine = LLMEngine()

engine.add_node("extracter", node=ExtracterNode())

engine.add_node("agent",
inputs=[("/extracter")],
node=LangChainAgentNode(agent_executor=_build_agent_executor(model_name=model_name)))

engine.add_task_handler(inputs=["/agent"], handler=SimpleTaskHandler())

return engine
logger = logging.getLogger(__name__)


def pipeline(
num_threads: int,
pipeline_batch_size,
model_max_batch_size,
model_name,
repeat_count,
) -> float:
def pipeline(num_threads: int,
pipeline_batch_size: int,
model_max_batch_size: int,
model_name: str,
repeat_count: int,
llm_orch: str) -> float:
config = Config()
config.mode = PipelineModes.OTHER

@@ -85,8 +50,12 @@ def pipeline(
config.edge_buffer_size = 128

source_dfs = [
cudf.DataFrame(
{"questions": ["Who is Leo DiCaprio's girlfriend? What is her current age raised to the 0.43 power?"]})
cudf.DataFrame({
"questions": [
"Who is Leo DiCaprio's girlfriend? What is her current age raised to the 0.43 power?",
"Who is the 7th president of United States?"
]
})
]

completion_task = {"task_type": "completion", "task_dict": {"input_keys": ["questions"], }}
@@ -100,7 +69,8 @@ def pipeline(

pipe.add_stage(MonitorStage(config, description="Source rate", unit='questions'))

pipe.add_stage(LLMEngineStage(config, engine=_build_engine(model_name=model_name)))
pipe.add_stage(LLMEngineStage(config, engine=build_engine_with_agent_node(model_name=model_name,
llm_orch=llm_orch)))

sink = pipe.add_stage(InMemorySinkStage(config))

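The `completion_task` built in this pipeline tells the engine's `ExtracterNode` which DataFrame columns to feed the agent. A simplified, framework-free sketch of that extraction step (Morpheus's actual node operates on `ControlMessage` payloads, not plain dicts):

```python
def extract_inputs(payload: dict, task_dict: dict) -> dict:
    """Pull the columns named in input_keys out of a tabular payload,
    mimicking what the ExtracterNode conceptually does."""
    return {key: payload[key] for key in task_dict["input_keys"]}


# The task and questions from simple_pipeline.py in this diff.
completion_task = {"task_type": "completion",
                   "task_dict": {"input_keys": ["questions"]}}

payload = {
    "questions": [
        "Who is Leo DiCaprio's girlfriend? "
        "What is her current age raised to the 0.43 power?",
        "Who is the 7th president of United States?",
    ],
}

agent_inputs = extract_inputs(payload, completion_task["task_dict"])
```

Only the columns listed in `input_keys` reach the agent node, which is why adding a second question to the source DataFrame (as this diff does) requires no change to the task definition.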