Spaces:

LunaticMaestro
/

N.AIQ2

Running

App Files Files Community

Deepak Sahu committed on May 20

Commit

97127b4

1 Parent(s): b70ec81

warm

Browse files

Files changed (21) hide show

.gitattributes +1 -0
.gitignore +1 -0
Dockerfile +24 -0
_data/retail_customer/Retail_Customer_Cluster_Data.xlsx +3 -0
_data/retail_customer/meta.md +19 -0
_data/retail_customer/readme.md +1 -0
config.yaml +26 -0
frontend.py +35 -0
pandas_expression_generator/pyproject.toml +18 -0
pandas_expression_generator/src/pandas_expression_generator.egg-info/PKG-INFO +7 -0
pandas_expression_generator/src/pandas_expression_generator.egg-info/SOURCES.txt +10 -0
pandas_expression_generator/src/pandas_expression_generator.egg-info/dependency_links.txt +1 -0
pandas_expression_generator/src/pandas_expression_generator.egg-info/entry_points.txt +2 -0
pandas_expression_generator/src/pandas_expression_generator.egg-info/requires.txt +1 -0
pandas_expression_generator/src/pandas_expression_generator.egg-info/top_level.txt +1 -0
pandas_expression_generator/src/pandas_expression_generator/__init__.py +0 -0
pandas_expression_generator/src/pandas_expression_generator/configs/config.yml +25 -0
pandas_expression_generator/src/pandas_expression_generator/pandas_expression_generator_function.py +154 -0
pandas_expression_generator/src/pandas_expression_generator/register.py +5 -0
requirements.txt +4 -0
start.sh +11 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+*.xlsx filter=lfs diff=lfs merge=lfs -text

.gitignore ADDED Viewed

	@@ -0,0 +1 @@


1	+ *.pyc

Dockerfile ADDED Viewed

	@@ -0,0 +1,24 @@

+# Start from the langchain/langchain base image
+FROM langchain/langchain
+# All following instructions run relative to /app
+WORKDIR /app
+# Copy only the dependency list first so the install layer below can be
+# reused from cache until requirements.txt itself changes
+COPY  requirements.txt requirements.txt
+# Install the Python dependencies without keeping pip's download cache
+RUN pip install --no-cache-dir -r requirements.txt
+# Copy the rest of the build context into /app
+COPY . .
+# NOTE(review): the steps below are commented out, so this image neither
+# installs the pandas_expression_generator package nor sets its own CMD —
+# confirm this is intentional.
+# Install agents
+# RUN pip install -e pandas_expression_generator
+# # Make the script executable
+# RUN chmod +x start.sh
+# Start both processes
+# CMD ["./start.sh"]

_data/retail_customer/Retail_Customer_Cluster_Data.xlsx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:643249aed77417875d9de227e9278f19a6fa015a27cccdcc1bfa6f30f96300ca
+size 14884

_data/retail_customer/meta.md ADDED Viewed

	@@ -0,0 +1,19 @@

+| Column Name               | Description                                          | Value Type  | Valid Data Regex / Allowed Values                  |
+|---------------------------|------------------------------------------------------|-------------|----------------------------------------------------|
+| CustomerID                | Unique customer identifier                          | Categorical | `CUST\d{3}`                                        |
+| Age                       | Age of the customer in years                        | Numerical   | `\d{1,3}`                                          |
+| Gender                    | Gender of the customer                              | Categorical | Male, Female, Other                                |
+| Income (Monthly)          | Monthly income of the customer                      | Numerical   | `\d+(\.\d+)?`                                      |
+| Location                  | Customer's city location                            | Categorical | Berlin, Hamburg, Cologne, Frankfurt                |
+| Purchase Frequency        | Number of purchases in a period                     | Numerical   | `\d+`                                              |
+| Avg. Transaction Value    | Average value per transaction                       | Numerical   | `\d+(\.\d+)?`                                      |
+| Loyalty Program Member    | Whether the customer is in loyalty program          | Categorical | Yes, No                                            |
+| Tenure (Months)           | How long they've been a customer (in months)        | Numerical   | `\d+`                                              |
+| Last Purchase Date        | Date of the last purchase                           | Date        | `\d{4}-\d{2}-\d{2}`     yyyy-mm-dd                           |
+| Total Spend (6M)          | Total spending in last 6 months                     | Numerical   | `\d+(\.\d+)?`                                      |
+| Visit Recency (Days)      | Days since last visit                               | Numerical   | `\d+`                                              |
+| Preferred Category        | Product category most often purchased               | Categorical | Grocery, Home, Beauty, Electronics                 |
+| Engagement Score          | Score representing user interaction                 | Numerical   | `\d+(\.\d+)?`                                      |
+| Value Score               | Score indicating customer value                     | Numerical   | `\d+(\.\d+)?`                                      |
+| Retention Risk Score      | Score estimating likelihood of customer churn       | Numerical   | `\d+(\.\d+)?`                                      |
+| Overall Customer Index    | Composite score for customer performance            | Numerical   | `\d+(\.\d+)?`                                      |

_data/retail_customer/readme.md ADDED Viewed

	@@ -0,0 +1 @@


1	+ This is synthetic data generated with ChatGPT.

config.yaml ADDED Viewed

	@@ -0,0 +1,26 @@

+general:
+  use_uvloop: true
+  logging:
+    console:
+      _type: console
+      level: WARN
+  # NOTE(review): `front_end` is declared twice in this mapping. Duplicate keys
+  # are not valid YAML; loaders that tolerate them typically keep only the last
+  # entry (console). Confirm which front end is intended and drop the other.
+  front_end:
+    _type: fastapi
+  front_end:
+    _type: console
+llms:
+  nim_llm:
+    _type: nim
+    model_name : meta/llama-3.1-405b-instruct
+    temperature: 0.0
+workflow:
+  _type: pandas_expression_generator
+  # Refers to the `nim_llm` entry defined under `llms` above
+  llm: nim_llm
+  # NOTE: despite the `csv_` prefix, this path points at an .xlsx workbook
+  csv_file: "/app/_data/retail_customer/Retail_Customer_Cluster_Data.xlsx"
+  # Markdown table describing the workbook's columns
+  csv_metafile: "/app/_data/retail_customer/meta.md"
+  description: "Use this tool to get data related to Customer Retails."

frontend.py ADDED Viewed

	@@ -0,0 +1,35 @@

+import gradio as gr
+import requests
+API_URL = "http://localhost:8000/chat"
+def chat_with_agentiq(message, history):
+    # Convert Gradio history to ChatML-style format
+    messages = []
+    for user_msg, agent_msg in history:
+        messages.append({"role": "User", "content": user_msg})
+        messages.append({"role": "Assistant", "content": agent_msg})
+    messages.append({"role": "User", "content": message})
+    payload = {
+        "messages": messages,
+        "model": "",  # Fill in your model name if required
+        "temperature": 0.7,
+        "max_tokens": 512,
+        "top_p": 1.0,
+        "additionalProp1": {}
+    }
+    try:
+        response = requests.post(API_URL, json=payload)
+        data = response.json()
+        reply = data["choices"][0]["message"]["content"]
+    except Exception as e:
+        reply = f"[Error: {str(e)}]"
+    return reply
+# Chat UI titled "AgentIQ Chat" that uses chat_with_agentiq as its handler.
+demo= gr.ChatInterface(fn=chat_with_agentiq, title="AgentIQ Chat")
+if __name__=="__main__":
+    # Bind to all interfaces on port 7860 when run as a script.
+    demo.launch(server_name="0.0.0.0", server_port=7860)

pandas_expression_generator/pyproject.toml ADDED Viewed

	@@ -0,0 +1,18 @@

+[build-system]
+build-backend = "setuptools.build_meta"
+requires = ["setuptools >= 64"]
+[project]
+name = "pandas_expression_generator"
+version = "0.1.0"
+dependencies = [
+  "aiqtoolkit[langchain]",
+]
+requires-python = ">=3.11,<3.13"
+description = "Custom AIQ Toolkit Workflow"
+classifiers = ["Programming Language :: Python"]
+[project.entry-points.'aiq.components']
+pandas_expression_generator = "pandas_expression_generator.register"

pandas_expression_generator/src/pandas_expression_generator.egg-info/PKG-INFO ADDED Viewed

	@@ -0,0 +1,7 @@

+Metadata-Version: 2.4
+Name: pandas_expression_generator
+Version: 0.1.0
+Summary: Custom AIQ Toolkit Workflow
+Classifier: Programming Language :: Python
+Requires-Python: <3.13,>=3.11
+Requires-Dist: aiqtoolkit[langchain]

pandas_expression_generator/src/pandas_expression_generator.egg-info/SOURCES.txt ADDED Viewed

	@@ -0,0 +1,10 @@

+pyproject.toml
+src/pandas_expression_generator/__init__.py
+src/pandas_expression_generator/pandas_expression_generator_function.py
+src/pandas_expression_generator/register.py
+src/pandas_expression_generator.egg-info/PKG-INFO
+src/pandas_expression_generator.egg-info/SOURCES.txt
+src/pandas_expression_generator.egg-info/dependency_links.txt
+src/pandas_expression_generator.egg-info/entry_points.txt
+src/pandas_expression_generator.egg-info/requires.txt
+src/pandas_expression_generator.egg-info/top_level.txt

pandas_expression_generator/src/pandas_expression_generator.egg-info/dependency_links.txt ADDED Viewed

	@@ -0,0 +1 @@


1	+

pandas_expression_generator/src/pandas_expression_generator.egg-info/entry_points.txt ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ [aiq.components]
2	+ pandas_expression_generator = pandas_expression_generator.register

pandas_expression_generator/src/pandas_expression_generator.egg-info/requires.txt ADDED Viewed

	@@ -0,0 +1 @@


1	+ aiqtoolkit[langchain]

pandas_expression_generator/src/pandas_expression_generator.egg-info/top_level.txt ADDED Viewed

	@@ -0,0 +1 @@


1	+ pandas_expression_generator

pandas_expression_generator/src/pandas_expression_generator/__init__.py ADDED Viewed

File without changes

pandas_expression_generator/src/pandas_expression_generator/configs/config.yml ADDED Viewed

	@@ -0,0 +1,25 @@

+general:
+  use_uvloop: true
+  logging:
+    console:
+      _type: console
+      level: WARN
+  # NOTE(review): `front_end` is declared twice in this mapping. Duplicate keys
+  # are not valid YAML; loaders that tolerate them typically keep only the last
+  # entry (console). Confirm which front end is intended and drop the other.
+  front_end:
+    _type: fastapi
+  front_end:
+    _type: console
+llms:
+  nim_llm:
+    _type: nim
+    model_name : meta/llama-3.1-405b-instruct
+    temperature: 0.0
+workflow:
+  _type: pandas_expression_generator
+  # Refers to the `nim_llm` entry defined under `llms` above
+  llm: nim_llm
+  # NOTE(review): absolute paths into /workspaces/do_aiq2 — presumably a
+  # development checkout; verify before using this config anywhere else.
+  # Despite the `csv_` prefix, csv_file points at an .xlsx workbook.
+  csv_file: "/workspaces/do_aiq2/_data/retail_customer/Retail_Customer_Cluster_Data.xlsx"
+  csv_metafile: "/workspaces/do_aiq2/_data/retail_customer/meta.md"
+  description: "Use this agent to handles retail customers data"

pandas_expression_generator/src/pandas_expression_generator/pandas_expression_generator_function.py ADDED Viewed

	@@ -0,0 +1,154 @@

+import logging
+from pydantic import Field
+from aiq.builder.builder import Builder
+from aiq.builder.function_info import FunctionInfo
+from aiq.cli.register_workflow import register_function
+from aiq.data_models.function import FunctionBaseConfig
+from aiq.data_models.component_ref import LLMRef
+from aiq.builder.framework_enum import LLMFrameworkEnum
+from langchain_core.messages import AIMessage
+import pandas as pd
+from pydantic import BaseModel
+import numpy as np
+logger = logging.getLogger(__name__)
+class PandasExpressionGeneratorFunctionConfig(FunctionBaseConfig, name="pandas_expression_generator"):
+    """
+    Settings for the `pandas_expression_generator` function.
+
+    Names the LLM to use, the data file to query, the text file describing its
+    columns, and the description the function is registered with.
+    """
+    # Add your custom configuration parameters here
+    # parameter: str = Field(default="default_value", description="Notional description for this parameter")
+    # Reference to the LLM that the function requests from the builder.
+    llm: LLMRef
+    # Path of the data file; it is loaded with pandas.read_excel despite the `csv_` prefix.
+    csv_file: str
+    # Path of the UTF-8 text file whose contents are pasted into the LLM prompt as column metadata.
+    csv_metafile: str
+    # Passed as the description when the function is registered.
+    description: str = Field(default="A dataset query engine", description="Describe for which data the engine is used for")
+    # NOTE(review): presumably the number of extra attempts after a failed
+    # request — confirm against the workflow function.
+    max_retries: int = Field(default=2)
+class FunctionInput(BaseModel):
+    # Input payload of the registered function; all four fields are
+    # interpolated into the LLM prompt.
+    # The user's question, passed through unchanged.
+    original_user_query: str = Field(description="The original user query as-is")
+    # Appears in the prompt under the label `past_step`.
+    thought: str = Field(description="Describe what's essential to solve the query")
+    # The step the generated expressions are asked to solve.
+    current_step: str = Field(description="Part of the intermediate step when resovling the big user query.")
+    # Context only: what is planned after the current step.
+    next_step: str = Field(description="What next are we plannning to do once we perform the current step.")
+@register_function(config_type=PandasExpressionGeneratorFunctionConfig)
+async def pandas_expression_generator_function(
+    config: PandasExpressionGeneratorFunctionConfig, builder: Builder
+):
+    df: pd.DataFrame = pd.read_excel(config.csv_file)
+    with open(config.csv_metafile, "r", encoding="utf-8") as f:
+        df_meta: str = f.read()
+    def extract_bracket_content(text):
+        start = text.find('[')
+        end = text.rfind(']') + 1  # include the last ']'
+        if start == -1 or end == -1 or start >= end:
+            return ""  # return empty if brackets not found properly
+        return text[start:end]
+    import ast
+    def expression_executor(input_exp: str, df=None) -> tuple:
+        # Convert the input string to a list
+        commands = ast.literal_eval(input_exp)
+        # local_vars = dict([(str.strip, command.split('=', 1)) for command in commands])
+        local_vars:dict = dict([list(map(str.strip, command.split('=', 1))) for command in commands])
+        # Dictionary to simulate local scope
+        local_vars.update({'df': df, 'pd': pd, 'np': np})
+        # local_vars = {}
+        for command in commands:
+            exec(command, globals(), local_vars)
+        # for command in commands:
+        #     # Split at the first `=`
+        #     var, expr = map(str.strip, command.split('=', 1))
+        #     # Evaluate the expression in the local_vars context and assign to var
+        #     local_vars[var] = eval(expr, {}, local_vars)
+        return local_vars.get("output", None)
+        try:
+            output
+            # output = scope.get("output")
+        except Exception as e:
+            logger.error("[expression_executor] ", e)
+            output = None
+        return output  # return all evaluated variables
+    # Implement your function logic here
+    async def _response_fn(input_query: FunctionInput) -> str:
+        # Create LLM
+        llm_ = await builder.get_llm(config.llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)
+        # Prompt
+        prompt_ = f'''You are a python expression generator.
+        Given the dataframe `df` and pandas import as `pd` which has the following metadata
+        CSV Meta
+        ---
+        {df_meta}
+        Generate python expression to solve the query:
+        current_step: {input_query.current_step}
+        You can reformulate(extend or reduce) the current step based on the following information
+        original_user_query: {input_query.original_user_query}
+        past_step: {input_query.thought}
+        next_step: {input_query.next_step}
+        You must generate list of python expressions output format must as follows:
+        [
+            "key_var = df[...]"                 // intermediate step
+            "key_var2 = key_var[df[...]...]"    // intermediate step
+                                                // reset the index of df if requrired
+                                                // convert the grouped dataframe to dictionaries
+                                                //
+            "output" = sting.  Have the string as list (records) of dictionaries (columns). Ensure to reset index if required
+        ]
+        Certain template questions and expected approach from you
+        1. When user wants to what is present in the data
+        > you should respond back with names of columns
+        Dont write reasoning; just list of strings which has python expressions
+        The list should not have markdown fencing.
+        '''
+        # just var declaration
+        df
+        try:
+            ai_message: AIMessage = await llm_.ainvoke(prompt_)
+            logger.info("[Following Should just be structured list of string]")
+            logger.info(ai_message)
+            structured_text_str = extract_bracket_content(ai_message.content)
+            output_message = str(expression_executor(structured_text_str, df))[:250]
+            #
+            # Loop break
+        except Exception as e:
+            logger.error(str(e))
+            logger.info("Retrying...")
+            output_message = "Unable to serve the request."
+            # output_message = f"Hello from pandas_expression_generator workflow! You said: {input_message}"
+        return output_message
+    try:
+        yield FunctionInfo.from_fn(
+            _response_fn,
+            description=config.description
+        )
+    except GeneratorExit:
+        print("Function exited early!")
+    finally:
+        print("Cleaning up pandas_expression_generator workflow.")

pandas_expression_generator/src/pandas_expression_generator/register.py ADDED Viewed

	@@ -0,0 +1,5 @@

+# pylint: disable=unused-import
+# flake8: noqa
+# Import any tools which need to be automatically registered here
+from pandas_expression_generator import pandas_expression_generator_function

requirements.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+gradio
+agentiq
+langgraph
+aiqtoolkit[langchain]

start.sh ADDED Viewed

	@@ -0,0 +1,11 @@

+#!/bin/bash
+# Launch the AIQ API server and the Gradio frontend side by side and stop
+# the whole script as soon as either of them exits.
+# Run both commands in parallel (both in the background, so that `wait -n`
+# below can observe whichever one exits first)
+aiq serve --config_file=config.yaml &
+python frontend.py &
+# Block until the first of the two background jobs exits
+wait -n
+status=$?
+# Stop the process that is still running so it is not left behind
+kill $(jobs -p) 2>/dev/null
+# Exit with the status of the process that exited first
+exit "$status"