
Commit 9f5be6a

Add example model artifacts.
1 parent 6c36b76 commit 9f5be6a

File tree

7 files changed: +635, -0 lines changed

LLM/deployment/model_artifacts/app.py

@@ -0,0 +1,6 @@
"""This module is a bare minimum example of an application.
"""


def invoke(inputs):
    return {"message": f"This is an example app. Your inputs are: {str(inputs)}"}
@@ -0,0 +1,79 @@
"""This module contains a LangChain agent example to answer questions about currency exchange.

It uses OCI Generative AI as the LLM to:
1. Generate arguments for tool calling for obtaining the exchange rate.
2. Process the tool calling results (exchange rates in JSON payload).
3. Answer the user's question.

This module requires the following environment variable:
* PROJECT_COMPARTMENT_OCID, the compartment OCID for accessing the OCI Generative AI service.

By default, OCI model deployment can only access the OCI Generative AI endpoints
within the same region. Custom networking for the model deployment is required
if you deploy the app in a different region.

Custom networking with internet access is required for this app to run the get_exchange_rate() function.

For more information on custom networking, see:
https://docs.oracle.com/en-us/iaas/data-science/using/model-dep-create-cus-net.htm

"""

import os
import requests
from langchain.agents import create_tool_calling_agent, AgentExecutor
from langchain_community.chat_models.oci_generative_ai import ChatOCIGenAI
from langchain_core.tools import tool
from langchain_core.prompts import ChatPromptTemplate


# Use LLM from OCI Generative AI service
llm = ChatOCIGenAI(
    model_id="cohere.command-r-plus",
    # Service endpoint is not needed if the Generative AI service is available in the same region.
    # service_endpoint="https://inference.generativeai.us-chicago-1.oci.oraclecloud.com",
    # Make sure you configure custom networking if you use a service endpoint in a different region.
    compartment_id=os.environ["PROJECT_COMPARTMENT_OCID"],
    model_kwargs={"temperature": 0, "max_tokens": 4000},
    auth_type="RESOURCE_PRINCIPAL",
)


@tool
def get_exchange_rate(currency: str) -> dict:
    """Obtain the current exchange rates of a currency to other currencies.

    Parameters
    ----------
    currency : str
        Currency in ISO 4217 3-letter currency code

    Returns
    -------
    dict:
        The value of `rates` is a dictionary containing the exchange rates to other currencies,
        in which the keys are the ISO 4217 3-letter currency codes.
    """

    response = requests.get(f"https://open.er-api.com/v6/latest/{currency}", timeout=10)
    return response.json()


tools = [get_exchange_rate]
prompt = ChatPromptTemplate.from_messages(
    [
        ("system", "You are a helpful assistant"),
        ("placeholder", "{chat_history}"),
        ("human", "{input}"),
        ("placeholder", "{agent_scratchpad}"),
    ]
)

agent = create_tool_calling_agent(llm, tools, prompt)
agent_executor = AgentExecutor(
    agent=agent, tools=tools, verbose=True, return_intermediate_steps=False
)


def invoke(message):
    return agent_executor.invoke({"input": message})
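A minimal usage sketch for the agent above. It assumes PROJECT_COMPARTMENT_OCID is set, the code runs where resource-principal auth is available (for example, a model deployment or notebook session with the right policies), and the module is importable as app (the actual filename is not shown in this diff):

from app import invoke  # hypothetical module name

# AgentExecutor.invoke() returns a dict; the final answer is under the "output" key.
result = invoke("What is the exchange rate from USD to EUR?")
print(result["output"])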
@@ -0,0 +1,239 @@
"""LangGraph application containing a research node and a chart node.
Adapted from https://langchain-ai.github.io/langgraph/tutorials/multi_agent/multi-agent-collaboration/

This module requires the following environment variable:
* PROJECT_COMPARTMENT_OCID, the compartment OCID for accessing the OCI Generative AI service.

Custom networking with internet access is required for this app to run the Tavily search tool.

For more information on custom networking, see:
https://docs.oracle.com/en-us/iaas/data-science/using/model-dep-create-cus-net.htm
"""

import base64
import os
import operator
import tempfile
import traceback
from typing import Annotated, Sequence
from typing_extensions import TypedDict

from ads.config import COMPARTMENT_OCID
from langchain_community.chat_models.oci_generative_ai import ChatOCIGenAI
from langchain_community.tools.tavily_search import TavilySearchResults
from langchain_core.messages import (
    AIMessage,
    BaseMessage,
    HumanMessage,
    ToolMessage,
)
from langchain_core.prompts import ChatPromptTemplate, MessagesPlaceholder
from langchain_core.tools import tool
from langchain_experimental.utilities import PythonREPL
from langgraph.prebuilt import ToolNode
from langgraph.graph import START, END, StateGraph

# Use LLM from OCI Generative AI service
llm = ChatOCIGenAI(
    model_id="cohere.command-r-plus",
    # Service endpoint is not needed if the Generative AI service is available in the same region.
    # service_endpoint="https://inference.generativeai.us-chicago-1.oci.oraclecloud.com",
    compartment_id=COMPARTMENT_OCID,
    model_kwargs={"temperature": 0, "max_tokens": 4000},
    auth_type="RESOURCE_PRINCIPAL",
)

# Search tool
tavily_tool = TavilySearchResults(max_results=5)

# Python code execution tool
repl = PythonREPL()


@tool
def python_repl(
    code: Annotated[str, "The python code to execute to generate your chart."],
):
    """Use this to execute python code. If you want to see the output of a value,
    you should print it out with `print(...)`. This is visible to the user."""
    try:
        # Set the timeout so the code will be run in a separate process.
        # This avoids the code changing variables in the current process.
        result = repl.run(code, timeout=30)
    except BaseException as e:
        return f"Failed to execute. Error: {repr(e)}"
    result_str = f"Successfully executed:\n```python\n{code}\n```\nStdout: {result}"
    return result_str


class AgentState(TypedDict):
    """Represents the state of the agents."""

    messages: Annotated[Sequence[BaseMessage], operator.add]
    sender: str


class AgentNode:
    """Represents an agent node."""

    def __init__(self, name, llm, system_message, tools=None) -> None:
        self.name = name
        instructions = (
            "You are a helpful AI agent,"
            " collaborating with other agents to work on a task step by step."
            " If you are unable to fully finish it, another agent may help where you left off."
            " Execute what you can to make progress."
            " If you or any of the other assistants have the final answer,"
            " or the team cannot make any progress,"
            " prefix your response with FINAL ANSWER so the team knows to stop."
        )
        if tools:
            tool_names = ", ".join([tool.name for tool in tools])
            instructions += f" You have access to the following tools: {tool_names}.\n"
            llm = llm.bind_tools(tools)
        instructions += system_message
        prompt = ChatPromptTemplate.from_messages(
            [
                (
                    "system",
                    instructions,
                ),
                MessagesPlaceholder(variable_name="messages"),
            ]
        )
        prompt = prompt.partial(system_message=system_message)
        self.agent = prompt | llm

    def __call__(self, state: AgentState) -> dict:
        result = self.agent.invoke(state)
        # Convert the agent output into a format that is suitable to append to the global state.
        if not isinstance(result, ToolMessage):
            result = AIMessage(**result.dict(exclude={"type", "name"}), name=self.name)
        return {
            "messages": [result],
            # Since we have a strict workflow, we can
            # track the sender so we know who to pass to next.
            "sender": self.name,
        }


# Nodes
RESEARCH_NODE = "research_node"
CHART_NODE = "chart_node"

# research
research_node = AgentNode(
    RESEARCH_NODE,
    llm,
    system_message="You should provide accurate data for plotting the chart.",
    tools=[tavily_tool],
)


# Temp dir for saving the chart.
# Each thread will get a different temp dir.
tmp_dir = tempfile.TemporaryDirectory()
print(f"Temp directory: {tmp_dir.name}")
tmp_file = os.path.join(tmp_dir.name, "chart.png")
# chart
chart_node = AgentNode(
    CHART_NODE,
    llm,
    system_message=(
        f"Run Python code to plot the chart and save it to a file named {tmp_file}. "
        "Respond with FINAL ANSWER once the chart is plotted successfully."
    ),
    tools=[python_repl],
)

search_tool = ToolNode([tavily_tool])
chart_tool = ToolNode([python_repl])
SEARCH_TOOL = "search_tool"
CHART_TOOL = "chart_tool"


def research_path(state):
    """Router for research_node."""
    messages = state["messages"]
    last_message = messages[-1]
    if "FINAL ANSWER" in last_message.content:
        # Any agent decided the work is done
        return END
    if last_message.tool_calls:
        return SEARCH_TOOL
    else:
        return CHART_NODE


def chart_path(state):
    """Router for chart_node."""
    messages = state["messages"]
    last_message = messages[-1]
    if "FINAL ANSWER" in last_message.content:
        # Any agent decided the work is done
        return END
    if last_message.tool_calls:
        return CHART_TOOL
    else:
        return RESEARCH_NODE


workflow = StateGraph(AgentState)

workflow.add_node(CHART_NODE, chart_node)
workflow.add_node(RESEARCH_NODE, research_node)

workflow.add_node(SEARCH_TOOL, search_tool)
workflow.add_node(CHART_TOOL, chart_tool)

workflow.add_edge(START, RESEARCH_NODE)

workflow.add_conditional_edges(
    RESEARCH_NODE, research_path, {n: n for n in [SEARCH_TOOL, CHART_NODE, END]}
)
workflow.add_conditional_edges(
    CHART_NODE, chart_path, {n: n for n in [CHART_TOOL, RESEARCH_NODE, END]}
)


workflow.add_edge(CHART_TOOL, CHART_NODE)
workflow.add_edge(SEARCH_TOOL, RESEARCH_NODE)


graph = workflow.compile()


def invoke(message):
    """Invokes the graph."""
    events = graph.stream(
        {
            "messages": [HumanMessage(content=message)],
        },
        # Maximum number of steps to take in the graph
        {"recursion_limit": 10},
    )

    # Print and save the messages
    messages = []
    for event in events:
        for node, value in event.items():
            print(node)
            print("-" * 50)
            message = value["messages"][-1].content
            messages.append(message)
            print(message)
            print("=" * 50)

    # Load the chart and encode it with base64
    if os.path.exists(tmp_file):
        with open(tmp_file, mode="rb") as f:
            chart = base64.b64encode(f.read()).decode()
        print(f"Loaded chart from {tmp_file}")
        try:
            os.remove(tmp_file)
        except Exception:
            print(f"Failed to remove file {tmp_file}.")
            traceback.print_exc()
    else:
        chart = None
    return {"chart": chart, "messages": messages}
@@ -0,0 +1,16 @@
"""This module contains an invoke() function that runs for more than 1 minute.

To invoke this with model deployment, make sure you specify the "async" parameter
in the payload to save the results into OCI object storage.
"""

import time


def invoke(inputs):
    f_time = time.time()
    time.sleep(90)
    t_time = time.time()
    return {
        "message": f"This is an example app running for {str(t_time - f_time)} seconds."
    }
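Because invoke() sleeps for 90 seconds, a synchronous call simply blocks; the sketch below only illustrates that local behavior (the exact shape of the async model-deployment payload is not shown in this commit):

from app import invoke  # hypothetical module name

# Blocks for about 90 seconds before returning.
print(invoke({})["message"])
# This is an example app running for 90.0... seconds.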
@@ -0,0 +1,22 @@
MODEL_ARTIFACT_VERSION: "3.0"
MODEL_DEPLOYMENT:
  INFERENCE_CONDA_ENV:
    INFERENCE_ENV_PATH: ""
    INFERENCE_ENV_SLUG: ""
    INFERENCE_ENV_TYPE: ""
    INFERENCE_PYTHON_VERSION: ""
MODEL_PROVENANCE:
  PROJECT_OCID: ""
  TENANCY_OCID: ""
  TRAINING_CODE:
    ARTIFACT_DIRECTORY: /opt/ds/model/deployed_model
  TRAINING_COMPARTMENT_OCID: ""
  TRAINING_CONDA_ENV:
    TRAINING_ENV_PATH: ""
    TRAINING_ENV_SLUG: ""
    TRAINING_ENV_TYPE: ""
    TRAINING_PYTHON_VERSION: ""
  TRAINING_REGION: ""
  TRAINING_RESOURCE_OCID: ""
  USER_OCID: ""
  VM_IMAGE_INTERNAL_ID: ""
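The empty strings in this runtime YAML are placeholders to fill in per deployment. A hypothetical inference-environment section (all values illustrative, not taken from this commit) could look like:

MODEL_DEPLOYMENT:
  INFERENCE_CONDA_ENV:
    # Object storage path of a conda environment (illustrative values only).
    INFERENCE_ENV_PATH: "oci://<bucket>@<namespace>/conda_environments/cpu/myenv/1.0/myenv_v1_0"
    INFERENCE_ENV_SLUG: "myenv_v1_0"
    INFERENCE_ENV_TYPE: "published"
    INFERENCE_PYTHON_VERSION: "3.9"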
