Spaces:

vikramvasudevan
/

sanatan_ai

Running on CPU Upgrade

App Files Files Community

vikramvasudevan committed on Aug 12

Commit

ec6bd64

verified ·

1 Parent(s): d13c5ed

Upload folder using huggingface_hub

Browse files

Files changed (4) hide show

app.py +2 -2
config.py +7 -6
graph_helper.py +16 -8
tools.py +3 -2

app.py CHANGED Viewed

@@ -145,7 +145,7 @@ async def chat_streaming(debug_mode: bool, message, history, thread_id):
         "debug_mode": debug_mode,
         "messages": (history or []) + [{"role": "user", "content": message}],
     }
-    config = {"configurable": {"thread_id": thread_id}}
     start_time = time.time()
     streamed_response = ""
     final_response = ""
@@ -440,7 +440,7 @@ with gr.Blocks(
                         scripture["example_labels"], scripture["examples"]
                     ):
                         btn = gr.Button(value=f"{example_label}", size="sm")
-                        btn.click(close_side_bar,outputs=[sidebar]).then(
                             populate_chat_input,
                             inputs=[gr.State(example_text)],
                             outputs=[message_textbox],

         "debug_mode": debug_mode,
         "messages": (history or []) + [{"role": "user", "content": message}],
     }
+    config = {"configurable": {"thread_id": thread_id}, "recursion_limit": 15}
     start_time = time.time()
     streamed_response = ""
     final_response = ""
                         scripture["example_labels"], scripture["examples"]
                     ):
                         btn = gr.Button(value=f"{example_label}", size="sm")
+                        btn.click(close_side_bar, outputs=[sidebar]).then(
                             populate_chat_input,
                             inputs=[gr.State(example_text)],
                             outputs=[message_textbox],

config.py CHANGED Viewed

@@ -178,12 +178,13 @@ class SanatanConfig:
                 {
                     "name": "title",
                     "datatype": "str",
-                    "description": ("Title of this pasuram."
-                    "Use this when a specific prabandham code or name is given along with a relative verse number."
-                    "for example:\n"
-                    "- `TVM 1.8.3`\n"
-                    "- '3rd pasuram in the 8th Thiruvaimozhi of the 1st decade.' - you must convert this representation to the format '{prabandham_code} {nth_decade}.{nth_chapter}.{nth_pasuram}'\n"
-                    "If no decade is provided, assume decade = 1"
                     ),
                 },
                 {

                 {
                     "name": "title",
                     "datatype": "str",
+                    "description": (
+                        "Title of this pasuram."
+                        "Use this when a specific prabandham code or name is given along with a relative verse number."
+                        "for example:\n"
+                        "- `TVM 1.8.3`\n"
+                        "- if the user query is 'give me 3rd pasuram in the 8th Thiruvaimozhi of the 1st decade.' - you must convert this representation to the format '{prabandham_code} {nth_decade}.{nth_chapter}.{nth_pasuram}' and pass as filter vaoue to the `title` field. \n"
+                        "If no decade is provided but a prabandham name is provided, assume decade = 1"
                     ),
                 },
                 {

graph_helper.py CHANGED Viewed

@@ -1,3 +1,4 @@
 from typing import Annotated, TypedDict
 from langgraph.graph import StateGraph, START, END
 from langgraph.checkpoint.memory import MemorySaver
@@ -5,6 +6,7 @@ from langgraph.graph.message import add_messages
 from langchain_openai import ChatOpenAI
 from langgraph.graph.state import CompiledStateGraph
 from langchain_core.messages import AIMessage
 from tools import (
     tool_format_scripture_answer,
     tool_get_standardized_prabandham_names,
@@ -25,15 +27,17 @@ logger.setLevel(logging.INFO)
 class ChatState(TypedDict):
-    debug_mode : bool = True
     messages: Annotated[list[str], add_messages]
 def check_debug_condition(state: ChatState) -> str:
     """Choose the next graph node from the ``debug_mode`` flag in ``state``.

     Returns ``"validator"`` when ``state["debug_mode"]`` is truthy and
     ``"__end__"`` otherwise.
     """
     return "validator" if state["debug_mode"] else "__end__"
 def branching_condition(state: ChatState) -> str:
     last_message = state["messages"][-1]
     if hasattr(last_message, "tool_calls") and last_message.tool_calls:
@@ -188,6 +192,9 @@ Where:
         if not already_has_prompt:
             messages += [
                 SystemMessage(
                     content="⚠️ Do NOT summarize or compress the output from the `query` tool. It will be passed directly to `format_scripture_answer` tool that formats the answer **AS IS**. DO NOT REMOVE SANSKRIT/TAMIL TEXTS"
                 ),
@@ -197,7 +204,11 @@ Where:
                 SystemMessage(
                     content="For general scripture queries, always prefer semantic search (tool_search_db). Use metadata or literal search only if the user specifies an exact verse number, azhwar, divya desam or phrase."
                 ),
-                SystemMessage(content="""
                         When using tools, you may call the same tool multiple times in a single task ONLY if:
                         1. Each call has materially different arguments or targets a different piece of missing information.
                         2. You have a clear reason for another call that is explicitly based on the new results you just received.
@@ -207,7 +218,8 @@ Where:
                         Before each new call to the same tool, compare the planned arguments with your previous call(s).
                         If they are essentially the same, do NOT call it again — instead, proceed to generate the final validated output.
-                """)
             ]
         return {"messages": messages}
@@ -223,11 +235,7 @@ Where:
     graph.add_conditional_edges(
         "llm",
         branching_condition,
-        {
-            "tools": "tools",
-            "validator": "validator",
-            "__end__" : END
-        },
     )
     graph.add_edge("tools", "llm")
     graph.add_edge("validator", END)

+import json
 from typing import Annotated, TypedDict
 from langgraph.graph import StateGraph, START, END
 from langgraph.checkpoint.memory import MemorySaver
 from langchain_openai import ChatOpenAI
 from langgraph.graph.state import CompiledStateGraph
 from langchain_core.messages import AIMessage
+from config import SanatanConfig
 from tools import (
     tool_format_scripture_answer,
     tool_get_standardized_prabandham_names,
 class ChatState(TypedDict):
+    debug_mode: bool = True
     messages: Annotated[list[str], add_messages]
 def check_debug_condition(state: ChatState) -> str:
     """Route to the validator node only when debugging is switched on.

     Reads ``state["debug_mode"]``; a truthy value yields ``"validator"``,
     anything else yields ``"__end__"``.
     """
     next_node = "__end__"
     if state["debug_mode"]:
         next_node = "validator"
     return next_node
 def branching_condition(state: ChatState) -> str:
     last_message = state["messages"][-1]
     if hasattr(last_message, "tool_calls") and last_message.tool_calls:
         if not already_has_prompt:
             messages += [
+                SystemMessage(
+                    content=f"Here is the list of all scriptures along with their metadata configuraiton:\n{json.dumps(SanatanConfig.scriptures, indent=1)}\n"
+                ),
                 SystemMessage(
                     content="⚠️ Do NOT summarize or compress the output from the `query` tool. It will be passed directly to `format_scripture_answer` tool that formats the answer **AS IS**. DO NOT REMOVE SANSKRIT/TAMIL TEXTS"
                 ),
                 SystemMessage(
                     content="For general scripture queries, always prefer semantic search (tool_search_db). Use metadata or literal search only if the user specifies an exact verse number, azhwar, divya desam or phrase."
                 ),
+                SystemMessage(
+                    content="you must ALWAYS call one of the standardization tools available to get the correct entity name before using the `tool_search_db_by_metadata` tool."
+                ),
+                SystemMessage(
+                    content="""
                         When using tools, you may call the same tool multiple times in a single task ONLY if:
                         1. Each call has materially different arguments or targets a different piece of missing information.
                         2. You have a clear reason for another call that is explicitly based on the new results you just received.
                         Before each new call to the same tool, compare the planned arguments with your previous call(s).
                         If they are essentially the same, do NOT call it again — instead, proceed to generate the final validated output.
+                """
+                ),
             ]
         return {"messages": messages}
     graph.add_conditional_edges(
         "llm",
         branching_condition,
+        {"tools": "tools", "validator": "validator", "__end__": END},
     )
     graph.add_edge("tools", "llm")
     graph.add_edge("validator", END)

tools.py CHANGED Viewed

@@ -47,10 +47,12 @@ tool_search_db_for_literal = StructuredTool.from_function(
 tool_search_db_by_metadata = StructuredTool.from_function(
     query_by_metadata_field,
     description=(
-        "Use this tool **only when the user provides explicit metadata criteria**, such as: azhwar name, pasuram number, verse number, prabandham name, or divya desam name."
         " This is not meant for general queries."
         f" The collection_name must be one of: {', '.join(allowed_collections)}."
         "If the user asks for a specific azhwar, use `tool_get_standardized_azhwar_names` first."
         "If the user asks for a specific prabandham, use `tool_get_standardized_prabandham_names` first."
         "If the user mentions a divya desam, use `tool_get_standardized_divya_desam_names` first."
@@ -60,7 +62,6 @@ tool_search_db_by_metadata = StructuredTool.from_function(
         For example, if the tool returns Thirumālirum Solai, you must pass that exact string to tool_search_db_by_metadata. Do not change it to Thirumalirum Solai, Tirumalirumsolai, or anything else.
         🔍 This is critical for the search to return results correctly.
         🚫 Any deviation will cause the search to fail or miss results."""
-        f" Reference config:\n{json.dumps(SanatanConfig.scriptures, indent=1)}\n"
     ),
 )

 tool_search_db_by_metadata = StructuredTool.from_function(
     query_by_metadata_field,
+    name="tool_search_db_by_metadata",
     description=(
+        "Use this tool **only when the user provides explicit metadata criteria**, such as: azhwar name, pasuram number, verse number, decade, prabandham name, or divya desam name."
         " This is not meant for general queries."
         f" The collection_name must be one of: {', '.join(allowed_collections)}."
+        "you must ALWAYS call one of the standardization tools available to get the correct entity name before using this tool."
         "If the user asks for a specific azhwar, use `tool_get_standardized_azhwar_names` first."
         "If the user asks for a specific prabandham, use `tool_get_standardized_prabandham_names` first."
         "If the user mentions a divya desam, use `tool_get_standardized_divya_desam_names` first."
         For example, if the tool returns Thirumālirum Solai, you must pass that exact string to tool_search_db_by_metadata. Do not change it to Thirumalirum Solai, Tirumalirumsolai, or anything else.
         🔍 This is critical for the search to return results correctly.
         🚫 Any deviation will cause the search to fail or miss results."""
     ),
 )