{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "**Importing Libraries**" ] }, { "cell_type": "code", "execution_count": 1, "metadata": { "_cell_guid": "b1076dfc-b9ad-4769-8c92-a6c4dae69d19", "_uuid": "8f2839f25d086af736a60e9eeb907d3b93b6e0e5" }, "outputs": [], "source": [ "import numpy as np # linear algebra\n", "import pandas as pd # data processing, CSV file I/O (e.g. pd.read_csv)\n", "import ast\n", "import operator\n", "from textblob import TextBlob\n", "import pandas as pd\n", "import re\n", "import nltk\n", "from nltk import pos_tag\n", "from nltk.tokenize import word_tokenize\n", "from nltk.corpus import stopwords\n", "from nltk.stem.porter import PorterStemmer\n", "from nltk.stem import LancasterStemmer, WordNetLemmatizer\n", "import re, string, unicodedata\n", "import warnings\n", "warnings.filterwarnings(\"ignore\")" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "**Loading Dataset**" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | User_id | \n", "Product_id | \n", "Rating | \n", "Date | \n", "Review | \n", "Label | \n", "
---|---|---|---|---|---|---|
0 | \n", "923 | \n", "0 | \n", "3 | \n", "12/8/2014 | \n", "The food at snack is a selection of popular Gr... | \n", "-1 | \n", "
1 | \n", "924 | \n", "0 | \n", "3 | \n", "5/16/2013 | \n", "This little place in Soho is wonderful. I had ... | \n", "-1 | \n", "
2 | \n", "925 | \n", "0 | \n", "4 | \n", "7/1/2013 | \n", "ordered lunch for 15 from Snack last Friday. Â... | \n", "-1 | \n", "
3 | \n", "926 | \n", "0 | \n", "4 | \n", "7/28/2011 | \n", "This is a beautiful quaint little restaurant o... | \n", "-1 | \n", "
4 | \n", "927 | \n", "0 | \n", "4 | \n", "11/1/2010 | \n", "Snack is great place for a  casual sit down l... | \n", "-1 | \n", "
\n", " | User_id | \n", "Product_ID | \n", "Rating | \n", "Date | \n", "Reviews | \n", "Label | \n", "Review_Id | \n", "
---|---|---|---|---|---|---|---|
347072 | \n", "56118 | \n", "247 | \n", "5 | \n", "1/6/2015 | \n", "So good, if very slightly salty. No outside fo... | \n", "0 | \n", "347072 | \n", "
347073 | \n", "45392 | \n", "247 | \n", "4 | \n", "1/6/2015 | \n", "I'm a fan of Ramen (tried Ippudo first in 2010... | \n", "0 | \n", "347073 | \n", "
347074 | \n", "157682 | \n", "247 | \n", "4 | \n", "1/6/2015 | \n", "I LOVE their pulled pork. It's absolutely deli... | \n", "0 | \n", "347074 | \n", "
347075 | \n", "100734 | \n", "247 | \n", "3 | \n", "1/5/2015 | \n", "I ordered the modern ramen with black garlic s... | \n", "0 | \n", "347075 | \n", "
347076 | \n", "56506 | \n", "247 | \n", "5 | \n", "1/5/2015 | \n", "What? You haven't been to Ippudo yet? *slaps f... | \n", "0 | \n", "347076 | \n", "
\n", " | User_id | \n", "Product_ID | \n", "Rating | \n", "Date | \n", "Reviews | \n", "Label | \n", "Review_Id | \n", "Original Reviews | \n", "Features | \n", "Sentiment | \n", "
---|---|---|---|---|---|---|---|---|---|---|
347072 | \n", "56118 | \n", "247 | \n", "5 | \n", "1/6/2015 | \n", "good slightly salty outside food reservations ... | \n", "0 | \n", "347072 | \n", "So good, if very slightly salty. No outside fo... | \n", "[food reservations] | \n", "Positive | \n", "
347073 | \n", "45392 | \n", "247 | \n", "4 | \n", "1/6/2015 | \n", "fan ramen tried ippudo first 2010 ramen option... | \n", "0 | \n", "347073 | \n", "I'm a fan of Ramen (tried Ippudo first in 2010... | \n", "[fan ramen, ramen options, fair portion pay, a... | \n", "Positive | \n", "
347074 | \n", "157682 | \n", "247 | \n", "4 | \n", "1/6/2015 | \n", "love pulled pork absolutely delicious mustget ... | \n", "0 | \n", "347074 | \n", "I LOVE their pulled pork. It's absolutely deli... | \n", "[delicious mustget, service food good eel rice... | \n", "Positive | \n", "
347075 | \n", "100734 | \n", "247 | \n", "3 | \n", "1/5/2015 | \n", "ordered modern ramen black garlic sauce pretty... | \n", "0 | \n", "347075 | \n", "I ordered the modern ramen with black garlic s... | \n", "[modern ramen, black garlic sauce, pretty good... | \n", "Positive | \n", "
347076 | \n", "56506 | \n", "247 | \n", "5 | \n", "1/5/2015 | \n", "nt ippudo yet slaps face go best restaurant wo... | \n", "0 | \n", "347076 | \n", "What? You haven't been to Ippudo yet? *slaps f... | \n", "[nt ippudo, restaurant world bye] | \n", "Positive | \n", "
\n", " | User_id | \n", "Product_ID | \n", "Rating | \n", "Date | \n", "Reviews | \n", "Label | \n", "Review_Id | \n", "Original Reviews | \n", "Features | \n", "Sentiment | \n", "
---|---|---|---|---|---|---|---|---|---|---|
347094 | \n", "157688 | \n", "247 | \n", "1 | \n", "12/29/2014 | \n", "well u want quoted 2 hour wait think lot well ... | \n", "0 | \n", "347094 | \n", "Well if u want to be quoted 2 hour wait and th... | \n", "[horses bc, awful nt] | \n", "Negative | \n", "
347099 | \n", "13270 | \n", "247 | \n", "1 | \n", "12/28/2014 | \n", "ippudo rated restaurant nyc area year 2014 sma... | \n", "0 | \n", "347099 | \n", "IPPUDO is the most rated restaurant in the nyc... | \n", "[restaurant nyc area year, small review, veget... | \n", "Negative | \n", "
347117 | \n", "157697 | \n", "247 | \n", "3 | \n", "12/20/2014 | \n", "place overated wait long food pricey running l... | \n", "0 | \n", "347117 | \n", "This place is overated. Â The wait was long an... | \n", "[food pricey, nt seat friend, party friend lie... | \n", "Negative | \n", "
347127 | \n", "157699 | \n", "247 | \n", "3 | \n", "12/15/2014 | \n", "place used five star place us recently cut bac... | \n", "0 | \n", "347127 | \n", "This place used to be a five star place for us... | \n", "[star place, portion size, rid pork, ramen nt,... | \n", "Negative | \n", "
347148 | \n", "75089 | \n", "247 | \n", "3 | \n", "12/5/2014 | \n", "came way st marks ippudo ramen average quality... | \n", "0 | \n", "347148 | \n", "Came all the way to St. marks just for ippudo.... | \n", "[st marks ippudo ramen average quality, ramen ... | \n", "Negative | \n", "
\n", " | User_id | \n", "Product_ID | \n", "Rating | \n", "Date | \n", "Reviews | \n", "Label | \n", "Review_Id | \n", "Original Reviews | \n", "Features | \n", "Sentiment | \n", "
---|---|---|---|---|---|---|---|---|---|---|
347072 | \n", "56118 | \n", "247 | \n", "5 | \n", "1/6/2015 | \n", "good slightly salty outside food reservations ... | \n", "0 | \n", "347072 | \n", "So good, if very slightly salty. No outside fo... | \n", "[food reservations] | \n", "Positive | \n", "
347073 | \n", "45392 | \n", "247 | \n", "4 | \n", "1/6/2015 | \n", "fan ramen tried ippudo first 2010 ramen option... | \n", "0 | \n", "347073 | \n", "I'm a fan of Ramen (tried Ippudo first in 2010... | \n", "[fan ramen, ramen options, fair portion pay, a... | \n", "Positive | \n", "
347074 | \n", "157682 | \n", "247 | \n", "4 | \n", "1/6/2015 | \n", "love pulled pork absolutely delicious mustget ... | \n", "0 | \n", "347074 | \n", "I LOVE their pulled pork. It's absolutely deli... | \n", "[delicious mustget, service food good eel rice... | \n", "Positive | \n", "
347075 | \n", "100734 | \n", "247 | \n", "3 | \n", "1/5/2015 | \n", "ordered modern ramen black garlic sauce pretty... | \n", "0 | \n", "347075 | \n", "I ordered the modern ramen with black garlic s... | \n", "[modern ramen, black garlic sauce, pretty good... | \n", "Positive | \n", "
347076 | \n", "56506 | \n", "247 | \n", "5 | \n", "1/5/2015 | \n", "nt ippudo yet slaps face go best restaurant wo... | \n", "0 | \n", "347076 | \n", "What? You haven't been to Ippudo yet? *slaps f... | \n", "[nt ippudo, restaurant world bye] | \n", "Positive | \n", "
\n", " | User_id | \n", "Product_ID | \n", "Rating | \n", "Date | \n", "Reviews | \n", "Label | \n", "Review_Id | \n", "Original Reviews | \n", "Features | \n", "Sentiment | \n", "
---|---|---|---|---|---|---|---|---|---|---|
347359 | \n", "98585 | \n", "247 | \n", "5 | \n", "9/25/2014 | \n", "pork buns ftw | \n", "0 | \n", "347359 | \n", "pork buns ftw. | \n", "[pork buns ftw] | \n", "Neutral | \n", "
347364 | \n", "157774 | \n", "247 | \n", "5 | \n", "9/24/2014 | \n", "holy vegetarian ramen | \n", "0 | \n", "347364 | \n", "Holy vegetarian ramen. | \n", "[vegetarian ramen] | \n", "Neutral | \n", "
347399 | \n", "157792 | \n", "247 | \n", "4 | \n", "9/14/2014 | \n", "pork buns die | \n", "0 | \n", "347399 | \n", "the pork buns are to die for!! | \n", "[pork buns] | \n", "Neutral | \n", "
347418 | \n", "7946 | \n", "247 | \n", "4 | \n", "9/9/2014 | \n", "pork buns tho | \n", "0 | \n", "347418 | \n", "those pork buns tho. | \n", "[pork buns tho] | \n", "Neutral | \n", "
347426 | \n", "7765 | \n", "247 | \n", "4 | \n", "9/7/2014 | \n", "yummmmmmmmm | \n", "0 | \n", "347426 | \n", "Yummmmmmmmm | \n", "[] | \n", "Neutral | \n", "
\n", " | Date | \n", "Features | \n", "Label | \n", "Original Reviews | \n", "Product_ID | \n", "Rating | \n", "Review_Id | \n", "Reviews | \n", "Sentiment | \n", "User_id | \n", "
---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "8/20/2013 | \n", "[ramen ippudo, amazing things ippudo, great re... | \n", "0 | \n", "To be honest, I was pretty disappointed by the... | \n", "247 | \n", "3 | \n", "348937 | \n", "honest pretty disappointed ramen ippudo prior ... | \n", "Positive | \n", "28644 | \n", "
1 | \n", "4/14/2010 | \n", "[hrs trendy, expensive kind ramen place, side ... | \n", "0 | \n", "Expect a LONG wait. Â Average wait for dinner ... | \n", "247 | \n", "4 | \n", "352584 | \n", "expect long wait average wait dinner usually 4... | \n", "Positive | \n", "29778 | \n", "
2 | \n", "11/11/2012 | \n", "[place fav restaurant visit, new york, 630pm f... | \n", "0 | \n", "I'll add my 2 cents to the other 4000 reviews.... | \n", "247 | \n", "5 | \n", "349848 | \n", "add 2 cents 4000 reviews love place fav restau... | \n", "Positive | \n", "158470 | \n", "
3 | \n", "12/24/2013 | \n", "[visit ippudo disappoint, thursday afternoon w... | \n", "0 | \n", "My latest visit to Ippudo did not disappoint. ... | \n", "247 | \n", "4 | \n", "348461 | \n", "latest visit ippudo disappoint came thursday a... | \n", "Positive | \n", "10151 | \n", "
4 | \n", "11/8/2013 | \n", "[okay course, ramen places nyc visit, reviews ... | \n", "0 | \n", "Okay.. Of course I have to try one of the best... | \n", "247 | \n", "4 | \n", "348626 | \n", "okay course try one best ramen places nyc visi... | \n", "Positive | \n", "95663 | \n", "
5 | \n", "1/9/2011 | \n", "[reviews speaks, fan ramen broth, smooth thirs... | \n", "0 | \n", "Hands down, the best ramen I have yet tasted! ... | \n", "247 | \n", "5 | \n", "351816 | \n", "hands best ramen yet tasted 2000 reviews speak... | \n", "Positive | \n", "158880 | \n", "
6 | \n", "3/14/2010 | \n", "[new york, recommendation coworker, ramen nood... | \n", "0 | \n", "I went here while visiting my sister in New Yo... | \n", "247 | \n", "5 | \n", "352688 | \n", "went visiting sister new york got recommendati... | \n", "Positive | \n", "159063 | \n", "
7 | \n", "3/6/2011 | \n", "[review place year, accident bat shit, crazy i... | \n", "0 | \n", "So this place is growing on me. Â I swore I wr... | \n", "247 | \n", "4 | \n", "351591 | \n", "place growing swore wrote review place year ag... | \n", "Positive | \n", "11968 | \n", "
8 | \n", "9/12/2012 | \n", "[ippudo list, name cringe, previous reviews ex... | \n", "0 | \n", "Ippudo should be a on a list called \"Yelp's Mo... | \n", "247 | \n", "2 | \n", "349980 | \n", "ippudo list called yelp overrated reviews ever... | \n", "Negative | \n", "18712 | \n", "
9 | \n", "4/19/2011 | \n", "[wednesday night, ramen place, worth wait, ca ... | \n", "0 | \n", "We waited for about an hour to get seats one W... | \n", "247 | \n", "3 | \n", "351409 | \n", "waited hour get seats one wednesday night last... | \n", "Negative | \n", "158807 | \n", "
10 | \n", "9/21/2010 | \n", "[ippudo review, ramen places area making decis... | \n", "0 | \n", "I have been sitting on this Ippudo review, wai... | \n", "247 | \n", "2 | \n", "352178 | \n", "sitting ippudo review waiting try ramen places... | \n", "Negative | \n", "45628 | \n", "
11 | \n", "12/4/2008 | \n", "[email faithful foodie friends notify, concur ... | \n", "0 | \n", "so. i was craving for ramen yesterday. shit ha... | \n", "247 | \n", "2 | \n", "353503 | \n", "craving ramen yesterday shit happens know emai... | \n", "Negative | \n", "30068 | \n", "
12 | \n", "2/12/2014 | \n", "[mmhmm refund, subway system, ippudo ny 310pm,... | \n", "0 | \n", "Over-hyped? Yes, totally. Overpriced? Mmhmm!!!... | \n", "247 | \n", "1 | \n", "348240 | \n", "overhyped yes totally overpriced mmhmm refund ... | \n", "Negative | \n", "158054 | \n", "
13 | \n", "7/26/2011 | \n", "[true ippudo japan hint hintif ippudo japan, p... | \n", "0 | \n", "I was torn between giving Ippudo 1 star or 2 s... | \n", "247 | \n", "1 | \n", "351107 | \n", "torn giving ippudo 1 star 2 stars wish could g... | \n", "Negative | \n", "115992 | \n", "
14 | \n", "4/4/2010 | \n", "[pork bun, pork bun akamaru, pork bun, expecta... | \n", "0 | \n", "Pork bun! 4**** I got the pork bun and the Aka... | \n", "247 | \n", "4 | \n", "352621 | \n", "pork bun 4 got pork bun akamaru modern first b... | \n", "Negative | \n", "72285 | \n", "
15 | \n", "12/28/2009 | \n", "[trip ippudo monday december, good meal, awful... | \n", "0 | \n", "Just got back from my first trip to Ippudo (Mo... | \n", "247 | \n", "1 | \n", "352894 | \n", "got back first trip ippudo monday december 28t... | \n", "Negative | \n", "4447 | \n", "
16 | \n", "2/15/2014 | \n", "[ramen delicious, pork buns] | \n", "0 | \n", "Ramen is delicious. Try the pork buns THe wait... | \n", "247 | \n", "4 | \n", "348232 | \n", "ramen delicious try pork buns wait insane | \n", "Neutral | \n", "127760 | \n", "
17 | \n", "12/6/2013 | \n", "[worth wait, tables empty, sister sister nt, p... | \n", "0 | \n", "Not worth the wait. I went here few times and ... | \n", "247 | \n", "1 | \n", "348525 | \n", "worth wait went times waited 2 hours first tim... | \n", "Neutral | \n", "79801 | \n", "
18 | \n", "8/3/2010 | \n", "[faint webster hall, hot bowl ramen, cold wet ... | \n", "0 | \n", "What can I say - after seeing Ladytron and the... | \n", "247 | \n", "5 | \n", "352312 | \n", "say seeing ladytron faint webster hall nothing... | \n", "Neutral | \n", "158981 | \n", "
19 | \n", "12/19/2012 | \n", "[line nt, pork buns bowl noodles, 1030am satur... | \n", "0 | \n", "I don't like waiting in line, and I don't like... | \n", "247 | \n", "4 | \n", "349740 | \n", "nt like waiting line nt like sitting strangers... | \n", "Neutral | \n", "7015 | \n", "