SearchGPT

Running

Shreyas094 committed on Jul 20, 2024

Commit

0bd56d6

verified ·

1 Parent(s): 2982f30

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -42,39 +42,33 @@ class Agent1:
                 text.strip().endswith('?') or
                 any(word in self.question_words for word in words))
-    def find_noun_phrases(self, sentence):
         tokens = nltk.pos_tag(word_tokenize(sentence))
-        noun_phrases = []
-        current_phrase = []
         for word, tag in tokens:
             if tag.startswith('NN'):
-                current_phrase.append(word)
-            elif current_phrase:
-                noun_phrases.append(' '.join(current_phrase))
-                current_phrase = []
-        if current_phrase:
-            noun_phrases.append(' '.join(current_phrase))
-        return noun_phrases
     def replace_pronoun(self, questions: List[str]) -> List[str]:
         if len(questions) < 2:
             return questions
-        # Find noun phrases in the first question
-        noun_phrases = self.find_noun_phrases(questions[0])
-        if not noun_phrases:
             return questions
-        # Use the last noun phrase as the antecedent
-        antecedent = noun_phrases[-1]
         # Replace pronouns in subsequent questions
         for i in range(1, len(questions)):
             words = word_tokenize(questions[i])
             for j, word in enumerate(words):
                 if word.lower() in self.pronouns:
-                    words[j] = antecedent
             questions[i] = ' '.join(words)
         return questions

                 text.strip().endswith('?') or
                 any(word in self.question_words for word in words))
+    def find_subject(self, sentence):
         tokens = nltk.pos_tag(word_tokenize(sentence))
+        subject = None
         for word, tag in tokens:
             if tag.startswith('NN'):
+                subject = word
+                break
+            if tag == 'IN':  # Stop at preposition
+                break
+        return subject
     def replace_pronoun(self, questions: List[str]) -> List[str]:
         if len(questions) < 2:
             return questions
+        # Find the subject in the first question
+        subject = self.find_subject(questions[0])
+        if not subject:
             return questions
         # Replace pronouns in subsequent questions
         for i in range(1, len(questions)):
             words = word_tokenize(questions[i])
             for j, word in enumerate(words):
                 if word.lower() in self.pronouns:
+                    words[j] = subject
             questions[i] = ' '.join(words)
         return questions