Spaces:

kevinhug
/

ai

Running

App Files Community

kevinhug committed 3 days ago

Commit

9bac96a

1 Parent(s): e79f773

label

Browse files

Files changed (3) hide show

app.py +126 -0
classify.py +24 -16
judge.py +1 -2

app.py CHANGED Viewed

@@ -478,6 +478,132 @@ Once created, knowledge graphs can be repurposed across multiple use cases (e.g.
     btn_recommend = gr.Button("Classify & Evaluation")
     btn_recommend.click(fn=judge, inputs=in_verbatim, outputs=out_product)
     gr.Markdown("""
 Benefits of Multi Class Classification
 ==================
 - Precision Decision-Making

     btn_recommend = gr.Button("Classify & Evaluation")
     btn_recommend.click(fn=judge, inputs=in_verbatim, outputs=out_product)
     gr.Markdown("""
+Example Output
+===========
+```
+{
+  "texts": [
+    "\"The online portal makes managing my mortgage payments so convenient.\"",
+    "\"RBC offer great mortgage for my home with competitive rate thank you\"",
+    "\"Low interest rate compared to other cards I’ve used. Highly recommend for responsible spenders.\"",
+    "\"The mobile check deposit feature saves me so much time. Banking made easy!\"",
+    "\"Affordable premiums with great coverage. Switched from my old provider and saved!\""
+  ],
+  "predictions": [
+    [
+      {
+        "chain_of_thought": [
+          "The customer mentions managing mortgage payments online, which directly relates to the 'online' tag.",
+          "There is no mention or implication of card, cars, insurance, or any other tags in the text."
+        ],
+        "name": "online",
+        "id": 0,
+        "confidence": 1.0
+      }
+    ],
+    [
+      {
+        "chain_of_thought": [
+          "The customer explicitly mentions 'mortgage for my home', which directly corresponds to the tag name 'mortgage'.",
+          "There is no mention of online, card, cars, or insurance in the text.",
+          "Therefore, we can confidently apply the mortgage tag."
+        ],
+        "name": "mortgage",
+        "id": 3,
+        "confidence": 1.0
+      }
+    ],
+    [
+      {
+        "chain_of_thought": [
+          "The customer mentions a low interest rate and compares it to other cards they have used. This indicates the text is related to a card product.",
+          "There is no mention of online services, cars, mortgage, or insurance in the text."
+        ],
+        "name": "card",
+        "id": 1,
+        "confidence": 0.9
+      }
+    ],
+    [
+      {
+        "chain_of_thought": [
+          "The customer explicitly mentions the mobile check deposit feature which is related to online banking services.",
+          "There is a Tag with id 0 named 'online' that matches the content of the text."
+        ],
+        "name": "online",
+        "id": 0,
+        "confidence": 1.0
+      }
+    ],
+    [
+      {
+        "chain_of_thought": [
+          "The customer mentions 'premiums' and 'coverage', which are related to insurance products. There is a tag named 'insurance' with id 4, so we can
+tag this text with 'insurance'.",
+          "There's no mention of online services, cards, cars, or mortgages in the text."
+        ],
+        "name": "insurance",
+        "id": 4,
+        "confidence": 0.9
+      }
+    ]
+  ],
+  "judgment": [
+    [
+      {
+        "thought": "The reasoning states that the customer mentioned managing mortgage payments online. The answer provided is 'online'. Since the context
+explicitly stated that the topic was about online management, it logically follows that 'online' would be the correct and relevant response.",
+        "justification": "The reasoning directly connects the mention of 'managing mortgage payments online' to the answer 'online', making the logic sound
+. There are no other tags or concepts mentioned that could have influenced this answer, so the connection is clear and valid.",
+        "logical": true
+      }
+    ],
+    [
+      {
+        "thought": "<thought>Given that the reasoning explicitly states 'mortgage for my home' and directly corresponds to the tag name 'mortgage', and the
+re's no mention of other financial products like online, card, cars, or insurance, it is logical to conclude that the answer 'mortgage' is correct. The con
+text provided supports this by not contradicting the reasoning.</thought>",
+        "justification": "<justification>The reasoning clearly states a direct match between the customer's statement and the tag name 'mortgage'. There ar
+e no conflicting elements in the text, making the connection sound and valid. Therefore, it is logical that the answer 'mortgage' is relevant to the given
+context.</justification>",
+        "logical": true
+      }
+    ],
+    [
+      {
+        "thought": "<thought>Given that the reasoning states there's a low interest rate mentioned and comparison to other cards, it logically follows that
+ 'card' would be an appropriate answer. The context, although incomplete, aligns with the reasoning as it pertains to card products.</thought>",
+        "justification": "<justification>The reasoning correctly identifies the topic of discussion (cards) based on key phrases like 'low interest rate' a
+nd 'comparison to other cards'. Since the answer provided is 'card', which directly corresponds to this context, the logical connection between the reasoni
+ng and the answer is valid.</justification>",
+        "logical": true
+      }
+    ],
+    [
+      {
+        "thought": "The reasoning states that the customer mentioned the mobile check deposit feature, which is related to online banking services. The con
+text provided a tag with id '0' named 'online', and the answer given is 'online'. This directly matches the content of the text, making it relevant.",
+        "justification": "Since the context provides a clear connection between the customer's mention of mobile check deposit (related to online banking)
+and the tag 'online', the answer 'online' is logically derived from this reasoning. The direct match in terms of content makes the logical link valid and s
+ound.",
+        "logical": true
+      }
+    ],
+    [
+      {
+        "thought": "<thought> The reasoning states that the context mentions 'premiums' and 'coverage', which are related to insurance. It also notes the p
+resence of an 'insurance' tag with id 4, suggesting this should be tagged as such. The answer provided is 'insurance', directly matching the reasoning's co
+nclusion. There is no mention in the text or reasoning that contradicts this.</thought>",
+        "justification": "<justification> The reasoning and the answer are logically consistent because they both point to the same key term, 'insurance'.
+The presence of relevant terms like 'premiums' and 'coverage', along with the explicit tag reference, support a logical connection between the context and
+the answer. There is no indication that any other services or products mentioned in the reasoning (like online services, cards, cars, or mortgages) are pre
+sent in the text.</justification>",
+        "logical": true
+      }
+    ]
+  ]
+}
+```
 Benefits of Multi Class Classification
 ==================
 - Precision Decision-Making

classify.py CHANGED Viewed

@@ -8,12 +8,11 @@ import os
 from groq import AsyncGroq
-# Initialize with API key
-client = AsyncGroq(api_key=os.getenv("GROQ_API_KEY"))
 # Enable instructor patches for Groq client
-client = instructor.from_groq(client)
-"""
 import openai
 client = instructor.from_openai(
     openai.AsyncOpenAI(
@@ -22,7 +21,7 @@ client = instructor.from_openai(
     ),
     mode=instructor.Mode.JSON,
 )
-"""
 llm = 'llama-3.1-8b-instant' if os.getenv("GROQ_API_KEY") else "qwen2.5" #"gemma3:12b" #"llama3.2" #"deepseek-r1"
@@ -35,9 +34,10 @@ class Tag(BaseModel):
         default=0.5,
         ge=0,
         le=1,
-        description="The confidence of the prediction(id, name) for the text, 0 is low, 1 is high",examples=[0.5,0.1,0.9]
     )
     @field_validator('confidence', mode="after")
     @classmethod
     def high_confidence(cls, c:float):
@@ -45,6 +45,7 @@ class Tag(BaseModel):
       if c < 0.6:
           raise ValueError(f"low confidence `{c}` ")
       return c
     @model_validator(mode="after")
     def validate_ids(self, info: ValidationInfo):
@@ -109,16 +110,20 @@ async def tag_single_request(text: str, tags: List[Tag]) -> Iterable[Tag]:
         messages=[
           {
             "role": "system",
-            "content": """You are a world-class text tagging system for customer feedback in the banking industry to classify banking product/services.
-  """
           },
-          {"role": "user", "content": f"""Create minimum multiple Tag according to instruction most appropriate for the following text: `{text}`
-            ### Instruction:
             Here are the allowed Tag(id, name), do not use any other Tag than these: {allowed_tags_str}
             Tag the name based on fact stated and directly mention in the text. Do not guess the name, Do not tag if tag not mention in the text. Do not use implication.
             Calculate the newly created Tag's confidence that Tag  fit to the text
             For each question, show your step-by-step thinking under 'chain_of_thought' in list of string, then clearly state your final answer under 'name'.
             """ },
         ],
@@ -134,19 +139,24 @@ async def tag_request(request: TagRequest) -> TagResponse:
   predictions = await asyncio.gather(
     *[tag_single_request(text, request.tags) for text in request.texts]
   )
   pred_dedup=[]
   for tags in predictions:
     if tags is not None:
       dedup=[]
-      #filter(lambda x: x.confidence > 0.7, tags)
-      tags_s=sorted(tags, key=lambda x: (x.name, x.confidence))
       if len(tags_s)>0:
         dedup.append(tags_s[0])
         for j in range(1,len(tags_s)):
           if tags_s[j-1].name!=tags_s[j].name:
             dedup.append(tags_s[j])
-      pred_dedup.append(dedup)
     else:
       pred_dedup.append(None)
@@ -166,11 +176,9 @@ tags = [
 texts = """
-"The online portal makes managing my mortgage payments so convenient."
-;"RBC offer great mortgage for my home with competitive rate thank you";
 "Low interest rate compared to other cards I’ve used. Highly recommend for responsible spenders.";
 "The mobile check deposit feature saves me so much time. Banking made easy!";
-"Affordable premiums with great coverage. Switched from my old provider and saved!"
 """
 def judge_response(response):

 from groq import AsyncGroq
 # Enable instructor patches for Groq client
+#client = instructor.from_groq(AsyncGroq(api_key=os.getenv("GROQ_API_KEY")))
+'''
 import openai
 client = instructor.from_openai(
     openai.AsyncOpenAI(
     ),
     mode=instructor.Mode.JSON,
 )
+'''
 llm = 'llama-3.1-8b-instant' if os.getenv("GROQ_API_KEY") else "qwen2.5" #"gemma3:12b" #"llama3.2" #"deepseek-r1"
         default=0.5,
         ge=0,
         le=1,
+        description="The confidence of the prediction(id, name) for the text, 0 is low, 1 is high"
     )
+    """
     @field_validator('confidence', mode="after")
     @classmethod
     def high_confidence(cls, c:float):
       if c < 0.6:
           raise ValueError(f"low confidence `{c}` ")
       return c
+    """
     @model_validator(mode="after")
     def validate_ids(self, info: ValidationInfo):
         messages=[
           {
             "role": "system",
+            "content": """You are a world-class text tagging system for customer feedback in the banking industry to classify banking product/services. """
           },
+          {"role": "user", "content": f"""Create minimum multiple Tag according to instruction most appropriate for the following text:
+            < Text >
+            {text}
+            </ Text>
+            < Instruction >
             Here are the allowed Tag(id, name), do not use any other Tag than these: {allowed_tags_str}
             Tag the name based on fact stated and directly mention in the text. Do not guess the name, Do not tag if tag not mention in the text. Do not use implication.
             Calculate the newly created Tag's confidence that Tag  fit to the text
             For each question, show your step-by-step thinking under 'chain_of_thought' in list of string, then clearly state your final answer under 'name'.
+            </ Instruction >
             """ },
         ],
   predictions = await asyncio.gather(
     *[tag_single_request(text, request.tags) for text in request.texts]
   )
   pred_dedup=[]
   for tags in predictions:
     if tags is not None:
       dedup=[]
+      #filter(lambda x: x>5, range(10))
+      t=list(filter(lambda x: x.confidence > 0.7, [tag async for tag in tags]))
+      #tags_s=set((n.name) for n in t) #sorted(t, key=lambda x: (x.name, x.confidence))
+      pred_dedup.append(t)
+      """
       if len(tags_s)>0:
         dedup.append(tags_s[0])
         for j in range(1,len(tags_s)):
           if tags_s[j-1].name!=tags_s[j].name:
             dedup.append(tags_s[j])
+      """
     else:
       pred_dedup.append(None)
 texts = """
+"The online portal makes managing my mortgage payments so convenient.";
 "Low interest rate compared to other cards I’ve used. Highly recommend for responsible spenders.";
 "The mobile check deposit feature saves me so much time. Banking made easy!";
 """
 def judge_response(response):

judge.py CHANGED Viewed

@@ -8,10 +8,9 @@ import os
 from groq import AsyncGroq
 # Initialize with API key
-client = AsyncGroq(api_key=os.getenv("GROQ_API_KEY"))
 # Enable instructor patches for Groq client
-client = instructor.from_groq(client)
 """
 client = instructor.from_openai(

 from groq import AsyncGroq
 # Initialize with API key
 # Enable instructor patches for Groq client
+client = instructor.from_groq(AsyncGroq(api_key=os.getenv("GROQ_API_KEY")))
 """
 client = instructor.from_openai(