File size: 6,155 Bytes
70e373f
 
56890f7
70e373f
 
 
 
 
 
 
 
 
 
 
 
 
 
df22a7e
70e373f
 
 
 
 
 
 
 
1d56a59
51faed1
546fac2
daf16cc
 
 
 
 
 
 
 
 
 
 
 
70e373f
657d5be
daf16cc
51faed1
ad67ce6
daf16cc
70e373f
 
 
 
f46456d
1094158
ff06efe
1094158
5f18f6e
 
821a5c8
000aa92
 
 
 
5f18f6e
70e373f
ad67ce6
ff06efe
5f18f6e
70e373f
29128dc
161ebae
1094158
41aed73
70e373f
 
 
 
aeb68b2
70e373f
58bca32
ff06efe
42c2b3f
1afd562
 
ff4d113
ff06efe
4718b38
1afd562
42c2b3f
ff06efe
1afd562
 
42c2b3f
161ebae
a461ac6
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
from transformers import AutoModelForSequenceClassification
from transformers import AutoTokenizer, AutoConfig
from clean_data import cleaned_complaints
import numpy as np
from scipy.special import softmax
import gradio as gr

# Preprocess text (username and link placeholders)
def preprocess(text):
    new_text = []
    for t in text.split(" "):
        t = '@user' if t.startswith('@') and len(t) > 1 else t
        t = 'http' if t.startswith('http') else t
        new_text.append(t)
    return " ".join(new_text)

# load model
MODEL = f"ThirdEyeData/Consumer-Complaint-Categorization"
model = AutoModelForSequenceClassification.from_pretrained(MODEL)
#model.save_pretrained(MODEL)


tokenizer = AutoTokenizer.from_pretrained(MODEL)
config = AutoConfig.from_pretrained(MODEL)

# create classifier function
def classify_compliant(text):
      text = cleaned_complaints(text)
      if len(text)<3:
          return "Cannot Categorize the Complaint"
      else:
          text = preprocess(text)
          encoded_input = tokenizer(text, return_tensors='pt')
          output = model(**encoded_input)
          scores = output[0][0].detach().numpy()
          scores = softmax(scores)

          # Print labels and scores
          probs = {}
          ranking = np.argsort(scores)
          ranking = ranking[::-1]

  
          l = config.id2label[ranking[0]]
        #s = scores[ranking[i]]
    #probs[l] = np.round(float(s), 4)
          return l


#build the Gradio app
#Instructuction = "Write an imaginary review about a product or service you might be interested in."
title="Customer Complaints Categorization"
description = """This application uses fine-tune BERT to perform Customer Complaints Categorization. BERT models are usually pretrained on a large corpus of text and then fine tuned for specific tasks.
Effectively handling customer complaints provides an opportunity for the service provider to resolve the customer’s problems on time and thus reduce dissatisfaction levels.

Write a complaint on an insurance product or service and see how the machine learning model is able to Categorisation your Complaint.
The Complaints Type are:
1. Debt Collection 
2. False Claim or Statement
3. Legal Issue
4. Improper contact or sharing of info
5. Follow Up Issue
"""
article = """
            - Click submit button to test Consumer Complaint Segmentation
            - Click the clear button to refresh the text
            - This application has a linked model https://huggingface.co/ThirdEyeData/Consumer-Complaint-Categorization 
           """

demo = gr.Interface(classify_compliant,
            inputs=gr.Textbox(lines =10,label = "Type your Complaint of our Product here or for a quick demo click on the examples provided below and output will automatically be populated in the output box ", max_lines = 20),
            outputs = gr.Textbox(lines =5,label = "Complaint Category"),
            title = title,
            description = description,
            #Instruction = Instructuction,
            article = article,
            #allow_flagging = "never",
            live = False,
            cache_example = False,
            examples=[["""The day before my Salliemae student loan payment was due I contacted a rep to discuss the impact on my account of making my payment at the end of the month rather than the middle for just that one month. 
            The rep indicated it would be no problem, but that I still may get a call  each day from Salliemae until I made my payment. I understood, requested my account be notated accordingly, and hung up. For two weeks I endured numerous calls per day ; 
            I lost count at six calls one day, which was the norm for the number of calls Salliemae made in an effort to collect a debt that had a due date that had been arranged and had not come up yet. """],
            ["""The representative told me the total amount due was {$2100.00} and that I can settle for half of that amount. Unfortunately, I was unable to accept the settlement but began to question the amount because my last statement was {$1800.00} and
            there was nothing written in the contract for additional interest charges should my account go into collection. 
            I told the representative that I will pay the amount actually owed and I want to make a payment arrangement. She told me I can't just do what I want, 
            If I want to pay the original amount due, it has to be paid in full. I told her that that is not fair debt collection practice and that I am only contractually obligated to the {$1800.00} and we can set up an arrangement from that. """] ,
             ["""This debt is beyond the Maryland Statute of Limitations. It is illegal for a debt collector to collect on an expired debt. They have taken illegal action by seizing my Maryland State Refund when the debt had already expired and beyond the Statute of Limitation which is 3 years in the state of Maryland"""],
              ["""The company  has been calling my employer in an attempt to collect a debt. When I spoke with them and informed them that this was not an appropriate number to call. I asked what company they were calling from and a phone number so he told me the company name,  but the man on the phone would not give me his name or a phone number. 
             I had mailed a letter requesting verification a few weeks ago and hadn't received anything back. In the letter I specifically requested that all communication be done through mail."""],
             [""" I do n't think I chose the correct issue above, however I think it is closest to my issue. I have a record on my credit report that I have disputed through both the company and the credit bureaus. The dispute is marked as being disputed by me on my report, but it was not removed despite the creditor not sending me verification of this debt.
             I do not even know what this debt is for.I have tried contacting the collection agency by mail to obtain verification with no response and they will not remove the item from my report."""]]
                
             )
if __name__ == "__main__":
    demo.launch()