diff --git "a/Week13_\353\263\265\354\212\265\352\263\274\354\240\234_\354\236\245\354\204\234\354\227\260.ipynb" "b/Week13_\353\263\265\354\212\265\352\263\274\354\240\234_\354\236\245\354\204\234\354\227\260.ipynb" new file mode 100644 index 0000000..3775fed --- /dev/null +++ "b/Week13_\353\263\265\354\212\265\352\263\274\354\240\234_\354\236\245\354\204\234\354\227\260.ipynb" @@ -0,0 +1,1294 @@ +{ + "nbformat": 4, + "nbformat_minor": 0, + "metadata": { + "colab": { + "provenance": [] + }, + "kernelspec": { + "name": "python3", + "display_name": "Python 3" + }, + "language_info": { + "name": "python" + } + }, + "cells": [ + { + "cell_type": "markdown", + "source": [ + "# 8.10장 캐글 Mercari Price Suggestion Challenge\n", + "\n", + "회귀로 피처 학습 ➡️ price 예측\n", + "\n", + "**📌 피처들 ( 정형 + 비정형 )**\n", + "\n", + "\n", + "* train_id : 데이터 id\n", + "* name : 제품명\n", + "\n", + "* item_condition_id : 판매자가 제공하는 제품 상태\n", + "\n", + "* category_name : 카테고리 명\n", + "* brand_name : 브랜드명\n", + "\n", + "\n", + "\n", + "* shipping : 배송비 무료 여부 (1 - 무료, 0 - 유료 )\n", + "\n", + "\n", + "* item_description : 제품 설명\n", + "\n", + "\n", + "* price : 제품 가격 ( target )\n" + ], + "metadata": { + "id": "DP6KtuAn0XmT" + } + }, + { + "cell_type": "markdown", + "source": [ + "## 데이터 전처리\n", + "\n", + "### 📌 결측치\n", + "- brand_name : 결측치 多 (전체 1482535건 중 849853건만 non-null)\n", + "- category_name : 결측치 6300\n", + "- item_description : 결측치 4\n", + "\n", + "### 📌 회귀에서 target값 정규 분포도 매우 중요\n", + "- price log변환\n", + "\n", + "### 📌 피처 불균형 확인\n", + "- shipping : 비교적 균일\n", + "- item_condition_id : 1,2,3이 주\n- item_description : 'No description yet' 값은 변경 필요\n", + "\n", + "### 📌 단어 토큰화\n", + "- category_name : / 기준 단어 토큰화, 별도 피처 저장 ➡️ split_cat()" + ], + "metadata": { + "id": "pFT9NTl72LuM" + } + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 311 + }, + "id": "nrPKjOrt0CJO", + "outputId": "9f1b654e-ed51-4673-fe3c-21aa21f4d9f5" + }, + "outputs": [ + { + "output_type": 
"stream", + "name": "stdout", + "text": [ + "(1482535, 8)\n" + ] + }, + { + "output_type": "execute_result", + "data": { + "text/plain": [ + " train_id name item_condition_id \\\n", + "0 0 MLB Cincinnati Reds T Shirt Size XL 3 \n", + "1 1 Razer BlackWidow Chroma Keyboard 3 \n", + "2 2 AVA-VIV Blouse 1 \n", + "3 3 Leather Horse Statues 1 \n", + "4 4 24K GOLD plated rose 1 \n", + "\n", + " category_name brand_name price \\\n", + "0 Men/Tops/T-shirts NaN 10.0 \n", + "1 Electronics/Computers & Tablets/Components & P... Razer 52.0 \n", + "2 Women/Tops & Blouses/Blouse Target 10.0 \n", + "3 Home/Home Décor/Home Décor Accents NaN 35.0 \n", + "4 Women/Jewelry/Necklaces NaN 44.0 \n", + "\n", + " shipping item_description \n", + "0 1 No description yet \n", + "1 0 This keyboard is in great condition and works ... \n", + "2 1 Adorable top with a hint of lace and a key hol... \n", + "3 1 New with tags. Leather horses. Retail for [rm]... \n", + "4 0 Complete with certificate of authenticity " + ], + "text/html": [ + "\n", + "
| \n", + " | train_id | \n", + "name | \n", + "item_condition_id | \n", + "category_name | \n", + "brand_name | \n", + "price | \n", + "shipping | \n", + "item_description | \n", + "
|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "0 | \n", + "MLB Cincinnati Reds T Shirt Size XL | \n", + "3 | \n", + "Men/Tops/T-shirts | \n", + "NaN | \n", + "10.0 | \n", + "1 | \n", + "No description yet | \n", + "
| 1 | \n", + "1 | \n", + "Razer BlackWidow Chroma Keyboard | \n", + "3 | \n", + "Electronics/Computers & Tablets/Components & P... | \n", + "Razer | \n", + "52.0 | \n", + "0 | \n", + "This keyboard is in great condition and works ... | \n", + "
| 2 | \n", + "2 | \n", + "AVA-VIV Blouse | \n", + "1 | \n", + "Women/Tops & Blouses/Blouse | \n", + "Target | \n", + "10.0 | \n", + "1 | \n", + "Adorable top with a hint of lace and a key hol... | \n", + "
| 3 | \n", + "3 | \n", + "Leather Horse Statues | \n", + "1 | \n", + "Home/Home Décor/Home Décor Accents | \n", + "NaN | \n", + "35.0 | \n", + "1 | \n", + "New with tags. Leather horses. Retail for [rm]... | \n", + "
| 4 | \n", + "4 | \n", + "24K GOLD plated rose | \n", + "1 | \n", + "Women/Jewelry/Necklaces | \n", + "NaN | \n", + "44.0 | \n", + "0 | \n", + "Complete with certificate of authenticity | \n", + "
| \n", + " | price | \n", + "
|---|---|
| 0 | \n", + "2.397895 | \n", + "
| 1 | \n", + "3.970292 | \n", + "
| 2 | \n", + "2.397895 | \n", + "
| 3 | \n", + "3.583519 | \n", + "
| 4 | \n", + "3.806662 | \n", + "
| \n", + " | 0 | \n", + "
|---|---|
| train_id | \n", + "0 | \n", + "
| name | \n", + "0 | \n", + "
| item_condition_id | \n", + "0 | \n", + "
| category_name | \n", + "0 | \n", + "
| brand_name | \n", + "0 | \n", + "
| price | \n", + "0 | \n", + "
| shipping | \n", + "0 | \n", + "
| item_description | \n", + "0 | \n", + "
| cat_dae | \n", + "0 | \n", + "
| cat_jung | \n", + "0 | \n", + "
| cat_so | \n", + "0 | \n", + "
| \n", + " | item_description | \n", + "
|---|---|
| 0 | \n", + "No description yet | \n", + "
| 1 | \n", + "This keyboard is in great condition and works like it came out of the box. All of the ports are tested and work perfectly. The lights are customizable via the Razer Synapse app on your PC. | \n", + "
LatentDirichletAllocation(n_components=8, random_state=0)In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
LatentDirichletAllocation(n_components=8, random_state=0)
| \n", + " | filename | \n", + "opinion_text | \n", + "
|---|---|---|
| 0 | \n", + "updates_garmin_nuvi_255W_gps | \n", + "Another thing to consider was that I paid $50 less for the 750 and it came with the FM transmitter cable and a USB cord to connect it to your computer for updates and downloads .\\n0 update and reroute much _more_ quickly than my other GPS .\\n1 UPDATE ON THIS , It finally turned out that to see the elevation contours at lowe... | \n", + "
| 1 | \n", + "voice_garmin_nuvi_255W_gps | \n", + "The voice prompts and maps are wonderful especially when driving after dark .\\n0 I also thought the the voice prompts of the 750 where more pleasant sounding than the 255w's .\\n1 ... | \n", + "
| 2 | \n", + "speed_windows7 | \n", + "Windows 7 is quite simply faster, more stable, boots faster, goes to sleep faster, comes back from sleep faster, manages your files better and on top of that it's beautiful to look at and easy to use .\\n0 , faster about 20% to 30% faster at running applications than my Vista , seriously\\n1 ... | \n", + "
| 3 | \n", + "video_ipod_nano_8gb | \n", + "I bought the 8, gig Ipod Nano that has the built, in video camera .\\n0 Itunes has an on, line store, where you may purchase and download music and videos which will install onto the ipod .\\n1 ... | \n", + "
| 4 | \n", + "staff_bestwestern_hotel_sfo | \n", + "Staff are friendl... | \n", + "
| \n", + " | filename | \n", + "opinion_text | \n", + "cluster_label | \n", + "
|---|---|---|---|
| 0 | \n", + "updates_garmin_nuvi_255W_gps | \n", + "Another thing to consider was that I paid $50 less for the 750 and it came with the FM transmitter cable and a USB cord to connect it to your computer for updates and downloads .\\n0 update and reroute much _more_ quickly than my other GPS .\\n1 UPDATE ON THIS , It finally turned out that to see the elevation contours at lowe... | \n", + "2 | \n", + "
| 1 | \n", + "voice_garmin_nuvi_255W_gps | \n", + "The voice prompts and maps are wonderful especially when driving after dark .\\n0 I also thought the the voice prompts of the 750 where more pleasant sounding than the 255w's .\\n1 ... | \n", + "2 | \n", + "
| 2 | \n", + "speed_windows7 | \n", + "Windows 7 is quite simply faster, more stable, boots faster, goes to sleep faster, comes back from sleep faster, manages your files better and on top of that it's beautiful to look at and easy to use .\\n0 , faster about 20% to 30% faster at running applications than my Vista , seriously\\n1 ... | \n", + "1 | \n", + "
| 3 | \n", + "video_ipod_nano_8gb | \n", + "I bought the 8, gig Ipod Nano that has the built, in video camera .\\n0 Itunes has an on, line store, where you may purchase and download music and videos which will install onto the ipod .\\n1 ... | \n", + "2 | \n", + "
| 4 | \n", + "staff_bestwestern_hotel_sfo | \n", + "Staff are friendl... | \n", + "0 | \n", + "
| \n", + " | filename | \n", + "opinion_text | \n", + "cluster_label | \n", + "
|---|---|---|---|
| 44 | \n", + "bathroom_bestwestern_hotel_sfo | \n", + "The room was not overly big, but clean and very comfortable beds, a great shower and very clean bathrooms .\\n0 The second room was smaller, with a very inconvenient bathroom layout, but at least it was quieter and we were able to sleep .\\n1 ... | \n", + "0 | \n", + "
| 32 | \n", + "food_holiday_inn_london | \n", + "The room was packed to capacity with queues at the food buffets .\\n0 The over zealous staff cleared our unfinished drinks while we were collecting cooked food and movement around the room with plates was difficult in the crowded circumstances .\\n1 ... | \n", + "0 | \n", + "
| 33 | \n", + "food_swissotel_chicago | \n", + "The food for our event was delicious .\\n0 ... | \n", + "0 | \n", + "
| 37 | \n", + "free_bestwestern_hotel_sfo | \n", + "The wine reception is a great idea as it is nice to meet other travellers and great having access to the free Internet access in our room .\\n0 They also have a computer available with free internet which is a nice bonus but I didn't find that out till the day before we left but was still able to get on there to check our flight to Vegas the next day .\\n1 ... | \n", + "0 | \n", + "
| 35 | \n", + "location_bestwestern_hotel_sfo | \n", + "Good Value good location , ideal choice .\\n0 Great Location , Nice Rooms , Helpless Concierge\\n1 ... | \n", + "0 | \n", + "
| 27 | \n", + "location_holiday_inn_london | \n", + "Great location for tube and we crammed in a fair amount of sightseeing in a short time .\\n0 All in all, a normal chain hotel on a nice lo... | \n", + "0 | \n", + "
| 29 | \n", + "parking_bestwestern_hotel_sfo | \n", + "Parking was expensive but I think this is common for San Fran .\\n0 there is a fee for parking but well worth it seeing no where to park if you do have a car .\\n1 ... | \n", + "0 | \n", + "
| 25 | \n", + "price_holiday_inn_london | \n", + "All in all, a normal chain hotel on a nice location , I will be back if I do not find anthing closer to Picadilly for a better price .\\n0 ... | \n", + "0 | \n", + "
| 22 | \n", + "room_holiday_inn_london | \n", + "We arrived at 23,30 hours and they could not recommend a restaurant so we decided to go to Tesco, with very limited choices but when you are hingry you do not careNext day they rang the bell at 8,00 hours to clean the room, not being very nice being waken up so earlyEvery day they gave u... | \n", + "0 | \n", + "
| 23 | \n", + "rooms_bestwestern_hotel_sfo | \n", + "Great Location , Nice Rooms , H... | \n", + "0 | \n", + "
| 17 | \n", + "rooms_swissotel_chicago | \n", + "The Swissotel is one of our favorite hotels in Chicago and the corner rooms have the most fantastic views in the city .\\n0 The rooms look like they were just remodled and upgraded, there was an HD TV and a nice iHome docking station to put my iPod so I could set the alarm to wake up with my music instead of the radio .\\n1 ... | \n", + "0 | \n", + "
| 8 | \n", + "service_bestwestern_hotel_sfo | \n", + "Both of us having worked in tourism for over 14 years were very disappointed at the level of service provided by this gentleman .\\n0 The service was good, very friendly staff and we loved the free wine reception each night .\\n1 ... | \n", + "0 | \n", + "
| 12 | \n", + "service_holiday_inn_london | \n", + "not customer, oriented hotelvery low service levelboor reception\\n0 The room was quiet, clean, the bed and pillows were comfortable, and the serv... | \n", + "0 | \n", + "
| 7 | \n", + "service_swissotel_hotel_chicago | \n", + "Mediocre room and service for a very extravagant price .\\n0 ... | \n", + "0 | \n", + "
| 4 | \n", + "staff_bestwestern_hotel_sfo | \n", + "Staff are friendl... | \n", + "0 | \n", + "
| 5 | \n", + "staff_swissotel_chicago | \n", + "The staff at Swissotel were not particularly nice .\\n0 Each time I waited at the counter for staff for several minutes and then was waved to the desk upon my turn with no hello or anything, or apology for waiting in line .\\n1 ... | \n", + "0 | \n", + "
| \n", + " | filename | \n", + "opinion_text | \n", + "cluster_label | \n", + "
|---|---|---|---|
| 28 | \n", + "keyboard_netbook_1005ha | \n", + ", I think the new keyboard rivals the great hp mini keyboards .\\n0 Since the battery life difference is minimum, the only reason to upgrade would be to get the better keyboard .\\n1 The keyboard is now as good as t... | \n", + "1 | \n", + "
| 10 | \n", + "size_asus_netbook_1005ha | \n", + "A few other things I'd like to point out is that you must push the micro, sized right angle end of the ac adapter until it snaps in place or the battery may not charge .\\n0 The full size right shift k... | \n", + "1 | \n", + "
| 2 | \n", + "speed_windows7 | \n", + "Windows 7 is quite simply faster, more stable, boots faster, goes to sleep faster, comes back from sleep faster, manages your files better and on top of that it's beautiful to look at and easy to use .\\n0 , faster about 20% to 30% faster at running applications than my Vista , seriously\\n1 ... | \n", + "1 | \n", + "
| \n", + " | filename | \n", + "opinion_text | \n", + "cluster_label | \n", + "
|---|---|---|---|
| 46 | \n", + "accuracy_garmin_nuvi_255W_gps | \n", + ", and is very, very accurate .\\n0 but for the most part, we find that the Garmin software provides accurate directions, whereever we intend to go .\\n1 This functi... | \n", + "2 | \n", + "
| 42 | \n", + "directions_garmin_nuvi_255W_gps | \n", + "You also get upscale features like spoken directions including street names and programmable POIs .\\n0 I used to hesitate to go out of my directions but no... | \n", + "2 | \n", + "
| 48 | \n", + "display_garmin_nuvi_255W_gps | \n", + "3 quot widescreen display was a bonus .\\n0 This made for smoother graphics on the 255w of the vehicle moving along displayed roads, where the 750's display was more of a jerky movement .\\n1 ... | \n", + "2 | \n", + "
| 38 | \n", + "eyesight-issues_amazon_kindle | \n", + "It feels as easy to read as the K1 but doesn't seem any crisper to my eyes .\\n0 the white is really GREY, and to avoid considerable eye, strain I had to refresh pages every other page .\\n1 The dream has always been a portable electronic device that could hold a ton of reading material, automate subscriptions and fa... | \n", + "2 | \n", + "
| 40 | \n", + "features_windows7 | \n", + "I had to uninstall anti, virus and selected other programs, some of which did not have listings in the Programs and Features Control Panel section .\\n0 This review briefly touches upon some of the key features and enhancements of Microsoft's latest OS .\\n1 ... | \n", + "2 | \n", + "
| 34 | \n", + "fonts_amazon_kindle | \n", + "Being able to change the font sizes is awesome !\\n0 For whatever reason, Amazon decided to make the Font on the Home Screen ... | \n", + "2 | \n", + "
| 30 | \n", + "navigation_amazon_kindle | \n", + "In fact, the entire navigation structure has been completely revised , I'm still getting used to it but it's a huge step forward .\\n0 ... | \n", + "2 | \n", + "
| 15 | \n", + "satellite_garmin_nuvi_255W_gps | \n", + "It's fast to acquire satellites .\\n0 If you've ever had a Brand X GPS take you on some strange route that adds 20 minutes to your trip, has you turn the wrong way down a one way road, tell you to turn AFTER you've passed the street, frequently loses the satellite signal, or has old maps missing streets, you know how important this stuff is .\\n1 ... | \n", + "2 | \n", + "
| 21 | \n", + "screen_garmin_nuvi_255W_gps | \n", + "It is easy to read and when touching the screen it works great !\\n0 and zoom out buttons on the 255w to the same side of the screen which makes it a bit easier .\\n1 ... | \n", + "2 | \n", + "
| 16 | \n", + "screen_ipod_nano_8gb | \n", + "As always, the video screen is sharp and bright .\\n0 2, inch screen and a glossy, polished aluminum finish that one CNET editor described as looking like a Christmas tree ornament .\\n1 ... | \n", + "2 | \n", + "
| 14 | \n", + "screen_netbook_1005ha | \n", + "Keep in mind that once you get in a room full of light or step outdoors screen reflections could become annoying .\\n0 I've used mine outsi... | \n", + "2 | \n", + "
| 11 | \n", + "speed_garmin_nuvi_255W_gps | \n", + "Another feature on the 255w is a display of the posted speed limit on the road which you are currently on right above your current displayed speed .\\n0 I found myself not even looking at my car speedometer as I could easily see my current speed and the speed limit of my route at a glance .\\n1 ... | \n", + "2 | \n", + "
| 0 | \n", + "updates_garmin_nuvi_255W_gps | \n", + "Another thing to consider was that I paid $50 less for the 750 and it came with the FM transmitter cable and a USB cord to connect it to your computer for updates and downloads .\\n0 update and reroute much _more_ quickly than my other GPS .\\n1 UPDATE ON THIS , It finally turned out that to see the elevation contours at lowe... | \n", + "2 | \n", + "
| 3 | \n", + "video_ipod_nano_8gb | \n", + "I bought the 8, gig Ipod Nano that has the built, in video camera .\\n0 Itunes has an on, line store, where you may purchase and download music and videos which will install onto the ipod .\\n1 ... | \n", + "2 | \n", + "
| 1 | \n", + "voice_garmin_nuvi_255W_gps | \n", + "The voice prompts and maps are wonderful especially when driving after dark .\\n0 I also thought the the voice prompts of the 750 where more pleasant sounding than the 255w's .\\n1 ... | \n", + "2 | \n", + "
| \n", + " | filename | \n", + "opinion_text | \n", + "cluster_label | \n", + "
|---|---|---|---|
| 45 | \n", + "battery-life_amazon_kindle | \n", + "After I plugged it in to my USB hub on my computer to charge the battery the charging cord design is very clever !\\n0 After you have paged tru a 500, page book one, page, at, a, time to get from Chapter 2 to Chapter 15, see how excited you are about a low battery and all the time it took to get there !\\n1 ... | \n", + "3 | \n", + "
| 47 | \n", + "battery-life_ipod_nano_8gb | \n", + "short battery life I moved up from an 8gb .\\n0 I love this ipod except for the battery life .\\n1 ... | \n", + "3 | \n", + "
| 50 | \n", + "battery-life_netbook_1005ha | \n", + "6GHz 533FSB cpu, glossy display, 3, Cell 23Wh Li, ion Battery , and a 1 .\\n0 Not to mention that as of now... | \n", + "3 | \n", + "
| 49 | \n", + "buttons_amazon_kindle | \n", + "I thought it would be fitting to christen my Kindle with the Stephen King novella UR, so went to the Amazon site on my computer and clicked on the button to buy it .\\n0 As soon as I'd clicked the button to confirm my order it appeared on my Kindle almost immediately !\\n1 ... | \n", + "3 | \n", + "
| 20 | \n", + "performance_netbook_1005ha | \n", + "The Eee Super Hybrid Engine utility lets users overclock or underclock their Eee PC's to boost performance or provide better battery life depending on their immediate requirements .\\n0 In Super Performance mode CPU, Z shows the bus speed to increase up to 169 .\\n1 One... | \n", + "3 | \n", + "
| 19 | \n", + "price_amazon_kindle | \n", + "If a case was included, as with the Kindle 1, that would have been reflected in a higher price .\\n0 lower overall price, with nice leather cover .\\n1 ... | \n", + "3 | \n", + "
| 13 | \n", + "sound_ipod_nano_8gb | \n", + "headphone jack i got a clear case for it and it i got a clear case for it and it like prvents me from being able to put the jack all the way in so the sound can b messsed up or i can get it in there and its playing well them go to move or something and it slides out .\\n0 Picture and sound quality are excellent for this typ of devic .\\n1 ... | \n", + "3 | \n", + "
| \n", + " | filename | \n", + "opinion_text | \n", + "cluster_label | \n", + "
|---|---|---|---|
| 41 | \n", + "comfort_honda_accord_2008 | \n", + "Drivers seat not comfortable, the car itself compared to other models of similar class .\\n0 ... | \n", + "4 | \n", + "
| 43 | \n", + "comfort_toyota_camry_2007 | \n", + "Ride seems comfortable and gas mileage fairly good averaging 26 city and 30 open road .\\n0 Seats are fine, in fact of all the smaller sedans this is the most comfortable I found for the price as I am 6', 2 and 250# .\\n1 Great gas mileage and comfortable on long trips ... | \n", + "4 | \n", + "
| 39 | \n", + "gas_mileage_toyota_camry_2007 | \n", + "Ride seems comfortable and gas mileage fairly good averaging 26 city and 30 open road .\\n0 ... | \n", + "4 | \n", + "
| 36 | \n", + "interior_honda_accord_2008 | \n", + "I love the new body style and the interior is a simple pleasure except for the center dash .\\n0 ... | \n", + "4 | \n", + "
| 26 | \n", + "interior_toyota_camry_2007 | \n", + "First of all, the interior has way too many cheap plastic parts like the cheap plastic center piece that houses the clock .\\n0 3 blown struts at 30,000 miles, interior trim coming loose and rattling squeaking, stains on paint, and bug splats taking paint off, premature uneven brake wear, on 3rd windsh... | \n", + "4 | \n", + "
| 31 | \n", + "mileage_honda_accord_2008 | \n", + "It's quiet, get good gas mileage and looks clean inside and out .\\n0 The mileage is great, and I've had to get used to stopping less for gas .\\n1 Thought gas ... | \n", + "4 | \n", + "
| 18 | \n", + "performance_honda_accord_2008 | \n", + "Very happy with my 08 Accord, performance is quite adequate it has nice looks and is a great long, distance cruiser .\\n0 6, 4, 3 eco engine has poor performance and gas mileage of 22 highway .\\n1 Overall performance is good but comfort level is poor .\\n2 ... | \n", + "4 | \n", + "
| 24 | \n", + "quality_toyota_camry_2007 | \n", + "I previously owned a Toyota 4Runner which had incredible build quality and reliability .\\n0 I bought the Camry because of Toyota reliability and qua... | \n", + "4 | \n", + "
| 9 | \n", + "seats_honda_accord_2008 | \n", + "Front seats are very uncomfortable .\\n0 No memory seats, no trip computer, can only display outside temp with trip odometer .\\n1 ... | \n", + "4 | \n", + "
| 6 | \n", + "transmission_toyota_camry_2007 | \n", + "After slowing down, transmission has to be kicked to speed up .\\n0 ... | \n", + "4 | \n", + "
| \n", + " | filename | \n", + "opinion_text | \n", + "cluster_label | \n", + "
|---|---|---|---|
| 5 | \n", + "staff_swissotel_chicago | \n", + "The staff at Swissotel were not particularly nice .\\n0 Each time I waited at the counter for staff for several minutes and then was waved to the desk upon my turn with no hello or anything, or apology for waiting in line .\\n1 ... | \n", + "0 | \n", + "
| 7 | \n", + "service_swissotel_hotel_chicago | \n", + "Mediocre room and service for a very extravagant price .\\n0 ... | \n", + "0 | \n", + "
| 4 | \n", + "staff_bestwestern_hotel_sfo | \n", + "Staff are friendl... | \n", + "0 | \n", + "
| 8 | \n", + "service_bestwestern_hotel_sfo | \n", + "Both of us having worked in tourism for over 14 years were very disappointed at the level of service provided by this gentleman .\\n0 The service was good, very friendly staff and we loved the free wine reception each night .\\n1 ... | \n", + "0 | \n", + "
| 12 | \n", + "service_holiday_inn_london | \n", + "not customer, oriented hotelvery low service levelboor reception\\n0 The room was quiet, clean, the bed and pillows were comfortable, and the serv... | \n", + "0 | \n", + "
| 22 | \n", + "room_holiday_inn_london | \n", + "We arrived at 23,30 hours and they could not recommend a restaurant so we decided to go to Tesco, with very limited choices but when you are hingry you do not careNext day they rang the bell at 8,00 hours to clean the room, not being very nice being waken up so earlyEvery day they gave u... | \n", + "0 | \n", + "
| 23 | \n", + "rooms_bestwestern_hotel_sfo | \n", + "Great Location , Nice Rooms , H... | \n", + "0 | \n", + "
| 17 | \n", + "rooms_swissotel_chicago | \n", + "The Swissotel is one of our favorite hotels in Chicago and the corner rooms have the most fantastic views in the city .\\n0 The rooms look like they were just remodled and upgraded, there was an HD TV and a nice iHome docking station to put my iPod so I could set the alarm to wake up with my music instead of the radio .\\n1 ... | \n", + "0 | \n", + "
| 25 | \n", + "price_holiday_inn_london | \n", + "All in all, a normal chain hotel on a nice location , I will be back if I do not find anthing closer to Picadilly for a better price .\\n0 ... | \n", + "0 | \n", + "
| 27 | \n", + "location_holiday_inn_london | \n", + "Great location for tube and we crammed in a fair amount of sightseeing in a short time .\\n0 All in all, a normal chain hotel on a nice lo... | \n", + "0 | \n", + "
| 29 | \n", + "parking_bestwestern_hotel_sfo | \n", + "Parking was expensive but I think this is common for San Fran .\\n0 there is a fee for parking but well worth it seeing no where to park if you do have a car .\\n1 ... | \n", + "0 | \n", + "
| 44 | \n", + "bathroom_bestwestern_hotel_sfo | \n", + "The room was not overly big, but clean and very comfortable beds, a great shower and very clean bathrooms .\\n0 The second room was smaller, with a very inconvenient bathroom layout, but at least it was quieter and we were able to sleep .\\n1 ... | \n", + "0 | \n", + "
| 37 | \n", + "free_bestwestern_hotel_sfo | \n", + "The wine reception is a great idea as it is nice to meet other travellers and great having access to the free Internet access in our room .\\n0 They also have a computer available with free internet which is a nice bonus but I didn't find that out till the day before we left but was still able to get on there to check our flight to Vegas the next day .\\n1 ... | \n", + "0 | \n", + "
| 35 | \n", + "location_bestwestern_hotel_sfo | \n", + "Good Value good location , ideal choice .\\n0 Great Location , Nice Rooms , Helpless Concierge\\n1 ... | \n", + "0 | \n", + "
| 33 | \n", + "food_swissotel_chicago | \n", + "The food for our event was delicious .\\n0 ... | \n", + "0 | \n", + "
| 32 | \n", + "food_holiday_inn_london | \n", + "The room was packed to capacity with queues at the food buffets .\\n0 The over zealous staff cleared our unfinished drinks while we were collecting cooked food and movement around the room with plates was difficult in the crowded circumstances .\\n1 ... | \n", + "0 | \n", + "
| 28 | \n", + "keyboard_netbook_1005ha | \n", + ", I think the new keyboard rivals the great hp mini keyboards .\\n0 Since the battery life difference is minimum, the only reason to upgrade would be to get the better keyboard .\\n1 The keyboard is now as good as t... | \n", + "1 | \n", + "
| 41 | \n", + "comfort_honda_accord_2008 | \n", + "Drivers seat not comfortable, the car itself compared to other models of similar class .\\n0 ... | \n", + "1 | \n", + "
| 43 | \n", + "comfort_toyota_camry_2007 | \n", + "Ride seems comfortable and gas mileage fairly good averaging 26 city and 30 open road .\\n0 Seats are fine, in fact of all the smaller sedans this is the most comfortable I found for the price as I am 6', 2 and 250# .\\n1 Great gas mileage and comfortable on long trips ... | \n", + "1 | \n", + "
| 24 | \n", + "quality_toyota_camry_2007 | \n", + "I previously owned a Toyota 4Runner which had incredible build quality and reliability .\\n0 I bought the Camry because of Toyota reliability and qua... | \n", + "1 | \n", + "
| 20 | \n", + "performance_netbook_1005ha | \n", + "The Eee Super Hybrid Engine utility lets users overclock or underclock their Eee PC's to boost performance or provide better battery life depending on their immediate requirements .\\n0 In Super Performance mode CPU, Z shows the bus speed to increase up to 169 .\\n1 One... | \n", + "1 | \n", + "
| 10 | \n", + "size_asus_netbook_1005ha | \n", + "A few other things I'd like to point out is that you must push the micro, sized right angle end of the ac adapter until it snaps in place or the battery may not charge .\\n0 The full size right shift k... | \n", + "1 | \n", + "
| 50 | \n", + "battery-life_netbook_1005ha | \n", + "6GHz 533FSB cpu, glossy display, 3, Cell 23Wh Li, ion Battery , and a 1 .\\n0 Not to mention that as of now... | \n", + "1 | \n", + "
| 47 | \n", + "battery-life_ipod_nano_8gb | \n", + "short battery life I moved up from an 8gb .\\n0 I love this ipod except for the battery life .\\n1 ... | \n", + "1 | \n", + "
| 45 | \n", + "battery-life_amazon_kindle | \n", + "After I plugged it in to my USB hub on my computer to charge the battery the charging cord design is very clever !\\n0 After you have paged tru a 500, page book one, page, at, a, time to get from Chapter 2 to Chapter 15, see how excited you are about a low battery and all the time it took to get there !\\n1 ... | \n", + "1 | \n", + "
| 2 | \n", + "speed_windows7 | \n", + "Windows 7 is quite simply faster, more stable, boots faster, goes to sleep faster, comes back from sleep faster, manages your files better and on top of that it's beautiful to look at and easy to use .\\n0 , faster about 20% to 30% faster at running applications than my Vista , seriously\\n1 ... | \n", + "1 | \n", + "
| 9 | \n", + "seats_honda_accord_2008 | \n", + "Front seats are very uncomfortable .\\n0 No memory seats, no trip computer, can only display outside temp with trip odometer .\\n1 ... | \n", + "1 | \n", + "
| 14 | \n", + "screen_netbook_1005ha | \n", + "Keep in mind that once you get in a room full of light or step outdoors screen reflections could become annoying .\\n0 I've used mine outsi... | \n", + "2 | \n", + "
| 3 | \n", + "video_ipod_nano_8gb | \n", + "I bought the 8, gig Ipod Nano that has the built, in video camera .\\n0 Itunes has an on, line store, where you may purchase and download music and videos which will install onto the ipod .\\n1 ... | \n", + "2 | \n", + "
| 1 | \n", + "voice_garmin_nuvi_255W_gps | \n", + "The voice prompts and maps are wonderful especially when driving after dark .\\n0 I also thought the the voice prompts of the 750 where more pleasant sounding than the 255w's .\\n1 ... | \n", + "2 | \n", + "
| 13 | \n", + "sound_ipod_nano_8gb | \n", + "headphone jack i got a clear case for it and it i got a clear case for it and it like prvents me from being able to put the jack all the way in so the sound can b messsed up or i can get it in there and its playing well them go to move or something and it slides out .\\n0 Picture and sound quality are excellent for this typ of devic .\\n1 ... | \n", + "2 | \n", + "
| 11 | \n", + "speed_garmin_nuvi_255W_gps | \n", + "Another feature on the 255w is a display of the posted speed limit on the road which you are currently on right above your current displayed speed .\\n0 I found myself not even looking at my car speedometer as I could easily see my current speed and the speed limit of my route at a glance .\\n1 ... | \n", + "2 | \n", + "
| 31 | \n", + "mileage_honda_accord_2008 | \n", + "It's quiet, get good gas mileage and looks clean inside and out .\\n0 The mileage is great, and I've had to get used to stopping less for gas .\\n1 Thought gas ... | \n", + "2 | \n", + "
| 30 | \n", + "navigation_amazon_kindle | \n", + "In fact, the entire navigation structure has been completely revised , I'm still getting used to it but it's a huge step forward .\\n0 ... | \n", + "2 | \n", + "
| 26 | \n", + "interior_toyota_camry_2007 | \n", + "First of all, the interior has way too many cheap plastic parts like the cheap plastic center piece that houses the clock .\\n0 3 blown struts at 30,000 miles, interior trim coming loose and rattling squeaking, stains on paint, and bug splats taking paint off, premature uneven brake wear, on 3rd windsh... | \n", + "2 | \n", + "
| 21 | \n", + "screen_garmin_nuvi_255W_gps | \n", + "It is easy to read and when touching the screen it works great !\\n0 and zoom out buttons on the 255w to the same side of the screen which makes it a bit easier .\\n1 ... | \n", + "2 | \n", + "
| 19 | \n", + "price_amazon_kindle | \n", + "If a case was included, as with the Kindle 1, that would have been reflected in a higher price .\\n0 lower overall price, with nice leather cover .\\n1 ... | \n", + "2 | \n", + "
| 18 | \n", + "performance_honda_accord_2008 | \n", + "Very happy with my 08 Accord, performance is quite adequate it has nice looks and is a great long, distance cruiser .\\n0 6, 4, 3 eco engine has poor performance and gas mileage of 22 highway .\\n1 Overall performance is good but comfort level is poor .\\n2 ... | \n", + "2 | \n", + "
| 16 | \n", + "screen_ipod_nano_8gb | \n", + "As always, the video screen is sharp and bright .\\n0 2, inch screen and a glossy, polished aluminum finish that one CNET editor described as looking like a Christmas tree ornament .\\n1 ... | \n", + "2 | \n", + "
| 15 | \n", + "satellite_garmin_nuvi_255W_gps | \n", + "It's fast to acquire satellites .\\n0 If you've ever had a Brand X GPS take you on some strange route that adds 20 minutes to your trip, has you turn the wrong way down a one way road, tell you to turn AFTER you've passed the street, frequently loses the satellite signal, or has old maps missing streets, you know how important this stuff is .\\n1 ... | \n", + "2 | \n", + "
| 6 | \n", + "transmission_toyota_camry_2007 | \n", + "After slowing down, transmission has to be kicked to speed up .\\n0 ... | \n", + "2 | \n", + "
| 0 | \n", + "updates_garmin_nuvi_255W_gps | \n", + "Another thing to consider was that I paid $50 less for the 750 and it came with the FM transmitter cable and a USB cord to connect it to your computer for updates and downloads .\\n0 update and reroute much _more_ quickly than my other GPS .\\n1 UPDATE ON THIS , It finally turned out that to see the elevation contours at lowe... | \n", + "2 | \n", + "
| 36 | \n", + "interior_honda_accord_2008 | \n", + "I love the new body style and the interior is a simple pleasure except for the center dash .\\n0 ... | \n", + "2 | \n", + "
| 38 | \n", + "eyesight-issues_amazon_kindle | \n", + "It feels as easy to read as the K1 but doesn't seem any crisper to my eyes .\\n0 the white is really GREY, and to avoid considerable eye, strain I had to refresh pages every other page .\\n1 The dream has always been a portable electronic device that could hold a ton of reading material, automate subscriptions and fa... | \n", + "2 | \n", + "
| 39 | \n", + "gas_mileage_toyota_camry_2007 | \n", + "Ride seems comfortable and gas mileage fairly good averaging 26 city and 30 open road .\\n0 ... | \n", + "2 | \n", + "
| 40 | \n", + "features_windows7 | \n", + "I had to uninstall anti, virus and selected other programs, some of which did not have listings in the Programs and Features Control Panel section .\\n0 This review briefly touches upon some of the key features and enhancements of Microsoft's latest OS .\\n1 ... | \n", + "2 | \n", + "
| 42 | \n", + "directions_garmin_nuvi_255W_gps | \n", + "You also get upscale features like spoken directions including street names and programmable POIs .\\n0 I used to hesitate to go out of my directions but no... | \n", + "2 | \n", + "
| 34 | \n", + "fonts_amazon_kindle | \n", + "Being able to change the font sizes is awesome !\\n0 For whatever reason, Amazon decided to make the Font on the Home Screen ... | \n", + "2 | \n", + "
| 46 | \n", + "accuracy_garmin_nuvi_255W_gps | \n", + ", and is very, very accurate .\\n0 but for the most part, we find that the Garmin software provides accurate directions, whereever we intend to go .\\n1 This functi... | \n", + "2 | \n", + "
| 48 | \n", + "display_garmin_nuvi_255W_gps | \n", + "3 quot widescreen display was a bonus .\\n0 This made for smoother graphics on the 255w of the vehicle moving along displayed roads, where the 750's display was more of a jerky movement .\\n1 ... | \n", + "2 | \n", + "
| 49 | \n", + "buttons_amazon_kindle | \n", + "I thought it would be fitting to christen my Kindle with the Stephen King novella UR, so went to the Amazon site on my computer and clicked on the button to buy it .\\n0 As soon as I'd clicked the button to confirm my order it appeared on my Kindle almost immediately !\\n1 ... | \n", + "2 | \n", + "
| \n", + " | filename | \n", + "opinion_text | \n", + "cluster_label | \n", + "
|---|---|---|---|
| 45 | \n", + "battery-life_amazon_kindle | \n", + "After I plugged it in to my USB hub on my computer to charge the battery the charging cord design is very clever !\\n0 After you have paged tru a 500, page book one, page, at, a, time to get from Chapter 2 to Chapter 15, see how excited you are about a low battery and all the time it took to get there !\\n1 ... | \n", + "1 | \n", + "
| 47 | \n", + "battery-life_ipod_nano_8gb | \n", + "short battery life I moved up from an 8gb .\\n0 I love this ipod except for the battery life .\\n1 ... | \n", + "1 | \n", + "
| 50 | \n", + "battery-life_netbook_1005ha | \n", + "6GHz 533FSB cpu, glossy display, 3, Cell 23Wh Li, ion Battery , and a 1 .\\n0 Not to mention that as of now... | \n", + "1 | \n", + "
| 41 | \n", + "comfort_honda_accord_2008 | \n", + "Drivers seat not comfortable, the car itself compared to other models of similar class .\\n0 ... | \n", + "1 | \n", + "
| 43 | \n", + "comfort_toyota_camry_2007 | \n", + "Ride seems comfortable and gas mileage fairly good averaging 26 city and 30 open road .\\n0 Seats are fine, in fact of all the smaller sedans this is the most comfortable I found for the price as I am 6', 2 and 250# .\\n1 Great gas mileage and comfortable on long trips ... | \n", + "1 | \n", + "
| 28 | \n", + "keyboard_netbook_1005ha | \n", + ", I think the new keyboard rivals the great hp mini keyboards .\\n0 Since the battery life difference is minimum, the only reason to upgrade would be to get the better keyboard .\\n1 The keyboard is now as good as t... | \n", + "1 | \n", + "
| 20 | \n", + "performance_netbook_1005ha | \n", + "The Eee Super Hybrid Engine utility lets users overclock or underclock their Eee PC's to boost performance or provide better battery life depending on their immediate requirements .\\n0 In Super Performance mode CPU, Z shows the bus speed to increase up to 169 .\\n1 One... | \n", + "1 | \n", + "
| 24 | \n", + "quality_toyota_camry_2007 | \n", + "I previously owned a Toyota 4Runner which had incredible build quality and reliability .\\n0 I bought the Camry because of Toyota reliability and qua... | \n", + "1 | \n", + "
| 9 | \n", + "seats_honda_accord_2008 | \n", + "Front seats are very uncomfortable .\\n0 No memory seats, no trip computer, can only display outside temp with trip odometer .\\n1 ... | \n", + "1 | \n", + "
| 10 | \n", + "size_asus_netbook_1005ha | \n", + "A few other things I'd like to point out is that you must push the micro, sized right angle end of the ac adapter until it snaps in place or the battery may not charge .\\n0 The full size right shift k... | \n", + "1 | \n", + "
| 2 | \n", + "speed_windows7 | \n", + "Windows 7 is quite simply faster, more stable, boots faster, goes to sleep faster, comes back from sleep faster, manages your files better and on top of that it's beautiful to look at and easy to use .\\n0 , faster about 20% to 30% faster at running applications than my Vista , seriously\\n1 ... | \n", + "1 | \n", + "
| \n", + " | filename | \n", + "opinion_text | \n", + "cluster_label | \n", + "
|---|---|---|---|
| 46 | \n", + "accuracy_garmin_nuvi_255W_gps | \n", + ", and is very, very accurate .\\n0 but for the most part, we find that the Garmin software provides accurate directions, whereever we intend to go .\\n1 This functi... | \n", + "2 | \n", + "
| 49 | \n", + "buttons_amazon_kindle | \n", + "I thought it would be fitting to christen my Kindle with the Stephen King novella UR, so went to the Amazon site on my computer and clicked on the button to buy it .\\n0 As soon as I'd clicked the button to confirm my order it appeared on my Kindle almost immediately !\\n1 ... | \n", + "2 | \n", + "
| 42 | \n", + "directions_garmin_nuvi_255W_gps | \n", + "You also get upscale features like spoken directions including street names and programmable POIs .\\n0 I used to hesitate to go out of my directions but no... | \n", + "2 | \n", + "
| 48 | \n", + "display_garmin_nuvi_255W_gps | \n", + "3 quot widescreen display was a bonus .\\n0 This made for smoother graphics on the 255w of the vehicle moving along displayed roads, where the 750's display was more of a jerky movement .\\n1 ... | \n", + "2 | \n", + "
| 38 | \n", + "eyesight-issues_amazon_kindle | \n", + "It feels as easy to read as the K1 but doesn't seem any crisper to my eyes .\\n0 the white is really GREY, and to avoid considerable eye, strain I had to refresh pages every other page .\\n1 The dream has always been a portable electronic device that could hold a ton of reading material, automate subscriptions and fa... | \n", + "2 | \n", + "
| 40 | \n", + "features_windows7 | \n", + "I had to uninstall anti, virus and selected other programs, some of which did not have listings in the Programs and Features Control Panel section .\\n0 This review briefly touches upon some of the key features and enhancements of Microsoft's latest OS .\\n1 ... | \n", + "2 | \n", + "
| 34 | \n", + "fonts_amazon_kindle | \n", + "Being able to change the font sizes is awesome !\\n0 For whatever reason, Amazon decided to make the Font on the Home Screen ... | \n", + "2 | \n", + "
| 39 | \n", + "gas_mileage_toyota_camry_2007 | \n", + "Ride seems comfortable and gas mileage fairly good averaging 26 city and 30 open road .\\n0 ... | \n", + "2 | \n", + "
| 36 | \n", + "interior_honda_accord_2008 | \n", + "I love the new body style and the interior is a simple pleasure except for the center dash .\\n0 ... | \n", + "2 | \n", + "
| 26 | \n", + "interior_toyota_camry_2007 | \n", + "First of all, the interior has way too many cheap plastic parts like the cheap plastic center piece that houses the clock .\\n0 3 blown struts at 30,000 miles, interior trim coming loose and rattling squeaking, stains on paint, and bug splats taking paint off, premature uneven brake wear, on 3rd windsh... | \n", + "2 | \n", + "
| 31 | \n", + "mileage_honda_accord_2008 | \n", + "It's quiet, get good gas mileage and looks clean inside and out .\\n0 The mileage is great, and I've had to get used to stopping less for gas .\\n1 Thought gas ... | \n", + "2 | \n", + "
| 30 | \n", + "navigation_amazon_kindle | \n", + "In fact, the entire navigation structure has been completely revised , I'm still getting used to it but it's a huge step forward .\\n0 ... | \n", + "2 | \n", + "
| 18 | \n", + "performance_honda_accord_2008 | \n", + "Very happy with my 08 Accord, performance is quite adequate it has nice looks and is a great long, distance cruiser .\\n0 6, 4, 3 eco engine has poor performance and gas mileage of 22 highway .\\n1 Overall performance is good but comfort level is poor .\\n2 ... | \n", + "2 | \n", + "
| 19 | \n", + "price_amazon_kindle | \n", + "If a case was included, as with the Kindle 1, that would have been reflected in a higher price .\\n0 lower overall price, with nice leather cover .\\n1 ... | \n", + "2 | \n", + "
| 15 | \n", + "satellite_garmin_nuvi_255W_gps | \n", + "It's fast to acquire satellites .\\n0 If you've ever had a Brand X GPS take you on some strange route that adds 20 minutes to your trip, has you turn the wrong way down a one way road, tell you to turn AFTER you've passed the street, frequently loses the satellite signal, or has old maps missing streets, you know how important this stuff is .\\n1 ... | \n", + "2 | \n", + "
| 21 | \n", + "screen_garmin_nuvi_255W_gps | \n", + "It is easy to read and when touching the screen it works great !\\n0 and zoom out buttons on the 255w to the same side of the screen which makes it a bit easier .\\n1 ... | \n", + "2 | \n", + "
| 16 | \n", + "screen_ipod_nano_8gb | \n", + "As always, the video screen is sharp and bright .\\n0 2, inch screen and a glossy, polished aluminum finish that one CNET editor described as looking like a Christmas tree ornament .\\n1 ... | \n", + "2 | \n", + "
| 14 | \n", + "screen_netbook_1005ha | \n", + "Keep in mind that once you get in a room full of light or step outdoors screen reflections could become annoying .\\n0 I've used mine outsi... | \n", + "2 | \n", + "
| 13 | \n", + "sound_ipod_nano_8gb | \n", + "headphone jack i got a clear case for it and it i got a clear case for it and it like prvents me from being able to put the jack all the way in so the sound can b messsed up or i can get it in there and its playing well them go to move or something and it slides out .\\n0 Picture and sound quality are excellent for this typ of devic .\\n1 ... | \n", + "2 | \n", + "
| 11 | \n", + "speed_garmin_nuvi_255W_gps | \n", + "Another feature on the 255w is a display of the posted speed limit on the road which you are currently on right above your current displayed speed .\\n0 I found myself not even looking at my car speedometer as I could easily see my current speed and the speed limit of my route at a glance .\\n1 ... | \n", + "2 | \n", + "
| 6 | \n", + "transmission_toyota_camry_2007 | \n", + "After slowing down, transmission has to be kicked to speed up .\\n0 ... | \n", + "2 | \n", + "
| 0 | \n", + "updates_garmin_nuvi_255W_gps | \n", + "Another thing to consider was that I paid $50 less for the 750 and it came with the FM transmitter cable and a USB cord to connect it to your computer for updates and downloads .\\n0 update and reroute much _more_ quickly than my other GPS .\\n1 UPDATE ON THIS , It finally turned out that to see the elevation contours at lowe... | \n", + "2 | \n", + "
| 3 | \n", + "video_ipod_nano_8gb | \n", + "I bought the 8, gig Ipod Nano that has the built, in video camera .\\n0 Itunes has an on, line store, where you may purchase and download music and videos which will install onto the ipod .\\n1 ... | \n", + "2 | \n", + "
| 1 | \n", + "voice_garmin_nuvi_255W_gps | \n", + "The voice prompts and maps are wonderful especially when driving after dark .\\n0 I also thought the the voice prompts of the 750 where more pleasant sounding than the 255w's .\\n1 ... | \n", + "2 | \n", + "
| \n", + " | id | \n", + "document | \n", + "label | \n", + "
|---|---|---|---|
| 0 | \n", + "9976970 | \n", + "아 더빙.. 진짜 짜증나네요 목소리 | \n", + "0 | \n", + "
| 1 | \n", + "3819312 | \n", + "흠...포스터보고 초딩영화줄....오버연기조차 가볍지 않구나 | \n", + "1 | \n", + "
| 2 | \n", + "10265843 | \n", + "너무재밓었다그래서보는것을추천한다 | \n", + "0 | \n", + "
| \n", + " | count | \n", + "
|---|---|
| label | \n", + "\n", + " |
| 0 | \n", + "75173 | \n", + "
| 1 | \n", + "74827 | \n", + "