{ "cells": [ { "cell_type": "code", "execution_count": 13, "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np" ] }, { "cell_type": "code", "execution_count": 16, "metadata": {}, "outputs": [], "source": [ "# data loading\n", "data = pd.read_csv('data//Combined_Data.csv')" ] }, { "cell_type": "code", "execution_count": 17, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | Unnamed: 0 | \n", "statement | \n", "status | \n", "
---|---|---|---|
0 | \n", "0 | \n", "oh my gosh | \n", "Anxiety | \n", "
1 | \n", "1 | \n", "trouble sleeping, confused mind, restless hear... | \n", "Anxiety | \n", "
2 | \n", "2 | \n", "All wrong, back off dear, forward doubt. Stay ... | \n", "Anxiety | \n", "
3 | \n", "3 | \n", "I've shifted my focus to something else but I'... | \n", "Anxiety | \n", "
4 | \n", "4 | \n", "I'm restless and restless, it's been a month n... | \n", "Anxiety | \n", "
\n", " | statement | \n", "status | \n", "
---|---|---|
0 | \n", "oh my gosh | \n", "Anxiety | \n", "
1 | \n", "trouble sleeping, confused mind, restless hear... | \n", "Anxiety | \n", "
2 | \n", "All wrong, back off dear, forward doubt. Stay ... | \n", "Anxiety | \n", "
3 | \n", "I've shifted my focus to something else but I'... | \n", "Anxiety | \n", "
4 | \n", "I'm restless and restless, it's been a month n... | \n", "Anxiety | \n", "
\n", " | statement | \n", "status | \n", "cleaned_statement | \n", "
---|---|---|---|
0 | \n", "oh my gosh | \n", "Anxiety | \n", "oh gosh | \n", "
1 | \n", "trouble sleeping, confused mind, restless hear... | \n", "Anxiety | \n", "trouble sleeping confused mind restless heart ... | \n", "
2 | \n", "All wrong, back off dear, forward doubt. Stay ... | \n", "Anxiety | \n", "wrong back dear forward doubt stay restless re... | \n", "
3 | \n", "I've shifted my focus to something else but I'... | \n", "Anxiety | \n", "ive shifted focus something else im still worried | \n", "
4 | \n", "I'm restless and restless, it's been a month n... | \n", "Anxiety | \n", "im restless restless month boy mean | \n", "
\n", " | cleaned_statement | \n", "status | \n", "
---|---|---|
0 | \n", "oh gosh | \n", "Anxiety | \n", "
1 | \n", "trouble sleeping confused mind restless heart ... | \n", "Anxiety | \n", "
2 | \n", "wrong back dear forward doubt stay restless re... | \n", "Anxiety | \n", "
3 | \n", "ive shifted focus something else im still worried | \n", "Anxiety | \n", "
4 | \n", "im restless restless month boy mean | \n", "Anxiety | \n", "
\n", " | cleaned_statement | \n", "status | \n", "
---|---|---|
0 | \n", "oh gosh | \n", "0 | \n", "
1 | \n", "trouble sleeping confused mind restless heart ... | \n", "0 | \n", "
2 | \n", "wrong back dear forward doubt stay restless re... | \n", "0 | \n", "
3 | \n", "ive shifted focus something else im still worried | \n", "0 | \n", "
4 | \n", "im restless restless month boy mean | \n", "0 | \n", "
RandomForestClassifier()In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
RandomForestClassifier()
Pipeline(steps=[('preprocessor', TextPreprocessor()),\n", " ('vectorizer', TfidfVectorizer()),\n", " ('classifier', RandomForestClassifier())])In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
Pipeline(steps=[('preprocessor', TextPreprocessor()),\n", " ('vectorizer', TfidfVectorizer()),\n", " ('classifier', RandomForestClassifier())])
TextPreprocessor()
TfidfVectorizer()
RandomForestClassifier()