From fa3c3a0bee06bd4e3336d367dc9397f49fe9c02d Mon Sep 17 00:00:00 2001 From: aahanatiwari <109433019+aahanatiwari@users.noreply.github.com> Date: Mon, 5 Jun 2023 19:50:33 +0530 Subject: [PATCH 1/2] Create aahana.txt --- aahana.txt | 1 + 1 file changed, 1 insertion(+) create mode 100644 aahana.txt diff --git a/aahana.txt b/aahana.txt new file mode 100644 index 0000000..8e23d96 --- /dev/null +++ b/aahana.txt @@ -0,0 +1 @@ +Aahana From 834db1a076a59d5c462602947b076821e5cc8177 Mon Sep 17 00:00:00 2001 From: aahanatiwari <109433019+aahanatiwari@users.noreply.github.com> Date: Sun, 9 Jul 2023 22:13:20 +0530 Subject: [PATCH 2/2] Created using Colaboratory --- Python_ML_Research.ipynb | 854 +++++++++++++++++++++++++++++++++++++++ 1 file changed, 854 insertions(+) create mode 100644 Python_ML_Research.ipynb diff --git a/Python_ML_Research.ipynb b/Python_ML_Research.ipynb new file mode 100644 index 0000000..7011349 --- /dev/null +++ b/Python_ML_Research.ipynb @@ -0,0 +1,854 @@ +{ + "nbformat": 4, + "nbformat_minor": 0, + "metadata": { + "colab": { + "provenance": [], + "authorship_tag": "ABX9TyMRTk7cN5kN0H1GuTdWLxq3", + "include_colab_link": true + }, + "kernelspec": { + "name": "python3", + "display_name": "Python 3" + }, + "language_info": { + "name": "python" + } + }, + "cells": [ + { + "cell_type": "markdown", + "metadata": { + "id": "view-in-github", + "colab_type": "text" + }, + "source": [ + "\"Open" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": { + "id": "G9iiwNbhM6nW" + }, + "outputs": [], + "source": [ + "import numpy as np\n", + "import pandas as pd" + ] + }, + { + "cell_type": "code", + "source": [ + "df = pd.read_csv('/content/sample_data/flipkart_reviews_large_dataset_sample.csv')" + ], + "metadata": { + "id": "agzK0iRoND7y" + }, + "execution_count": 7, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "df" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 1000 + }, + "id": "ZK0WmaxtV9KJ", + "outputId": "bca6b42b-f731-49de-f448-257b37d73f04" + }, + "execution_count": 8, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + " ProductUrl \\\n", + "0 https://www.flipkart.com/samsung-galaxy-nxt-go... \n", + "1 https://www.flipkart.com/samsung-galaxy-nxt-go... \n", + "2 https://www.flipkart.com/samsung-galaxy-nxt-go... \n", + "3 https://www.flipkart.com/samsung-galaxy-nxt-go... \n", + "4 https://www.flipkart.com/samsung-galaxy-nxt-go... \n", + ".. ... \n", + "669 https://www.flipkart.com/apple-iphone-12-blue-... \n", + "670 https://www.flipkart.com/zebronics-wireless-to... \n", + "671 https://www.flipkart.com/apple-iphone-12-blue-... \n", + "672 https://www.flipkart.com/zebronics-wireless-to... \n", + "673 https://www.flipkart.com/mmshopy-heavy-duty-ad... \n", + "\n", + " productTitle productPrice \\\n", + "0 SAMSUNG Galaxy On Nxt (Gold, 16 GB) ₹9,499 \n", + "1 SAMSUNG Galaxy On Nxt (Gold, 16 GB) ₹9,499 \n", + "2 SAMSUNG Galaxy On Nxt (Gold, 16 GB) ₹9,499 \n", + "3 SAMSUNG Galaxy On Nxt (Gold, 16 GB) ₹9,499 \n", + "4 SAMSUNG Galaxy On Nxt (Gold, 16 GB) ₹9,499 \n", + ".. ... ... \n", + "669 APPLE iPhone 12 (Blue, 128 GB) ₹64,999 \n", + "670 ZEBRONICS Wireless Totem 3 Wireless Optical Mouse ₹374 \n", + "671 APPLE iPhone 12 (Blue, 128 GB) ₹64,999 \n", + "672 ZEBRONICS Wireless Totem 3 Wireless Optical Mouse ₹374 \n", + "673 MMShopy Heavy Duty Adjustable Smartphone Phone... ₹219 \n", + "\n", + " averageRating reviewTitle \\\n", + "0 4.3 Just wow! \n", + "1 4.3 Awesome \n", + "2 4.3 Does the job \n", + "3 4.3 Good \n", + "4 4.3 Wonderful \n", + ".. ... ... \n", + "669 4.7 Highly recommended \n", + "670 3.7 Awesome \n", + "671 4.7 Pretty good \n", + "672 3.7 NaN \n", + "673 4.1 Best in the market! \n", + "\n", + " reviewDescription \\\n", + "0 unbelievable \n", + "1 good mobile \n", + "2 good \n", + "3 it's good \n", + "4 very nice \n", + ".. ... \n", + "669 amazing experience moving from android to ios \n", + "670 The product is so cheap and it is working prop... \n", + "671 Mind blowing camera \n", + "672 got a defected moues at first ,flipkart replac... \n", + "673 Excellent quality \n", + "\n", + " reviewAuthor reviewAt reviewLikes reviewDislikes \\\n", + "0 KOUSIK DUTTA Aug, 2018 0 0 \n", + "1 Flipkart Customer Aug, 2018 0 0 \n", + "2 Rakesh Ranjan Aug, 2018 0 0 \n", + "3 PabiT Gouda Aug, 2018 0 0 \n", + "4 Sujal Patel Aug, 2018 0 0 \n", + ".. ... ... ... ... \n", + "669 sidharth gurjar 3 months ago 0 0 \n", + "670 Hyma Gumpu Jan, 2015 0 0 \n", + "671 Vikas Kumar 3 months ago 0 0 \n", + "672 viresh gupta Jan, 2015 0 0 \n", + "673 Indrala Lakshmi Narayana 14 days ago 0 0 \n", + "\n", + " certifiedBuyer reviewerLocation fiveStarRatingCount \\\n", + "0 True Burdwan 2,20,147 \n", + "1 True Kurnool 2,20,147 \n", + "2 True Noida 2,20,147 \n", + "3 True Behror 2,20,147 \n", + "4 True Dharampur 2,20,147 \n", + ".. ... ... ... \n", + "669 True Raja Sansi 1,29,344 \n", + "670 True Vishakhapatnam 705 \n", + "671 True Samastipur District 1,29,344 \n", + "672 True Ghaziabad 705 \n", + "673 True Metpally 3,473 \n", + "\n", + " fourStarRatingCount threeStarRatingCount twoStarRatingCount \\\n", + "0 83,936 30,026 10,267 \n", + "1 83,936 30,026 10,267 \n", + "2 83,936 30,026 10,267 \n", + "3 83,936 30,026 10,267 \n", + "4 83,936 30,026 10,267 \n", + ".. ... ... ... \n", + "669 20,895 4,588 1,637 \n", + "670 397 249 136 \n", + "671 20,895 4,588 1,637 \n", + "672 397 249 136 \n", + "673 1,778 877 350 \n", + "\n", + " oneStarRatingCount reviewImages \\\n", + "0 21,199 NaN \n", + "1 21,199 NaN \n", + "2 21,199 NaN \n", + "3 21,199 NaN \n", + "4 21,199 NaN \n", + ".. ... ... \n", + "669 5,381 NaN \n", + "670 214 NaN \n", + "671 5,381 NaN \n", + "672 214 NaN \n", + "673 497 https://rukminim1.flixcart.com/blobio/124/124/... \n", + "\n", + " scrapedAt uniqId \n", + "0 21-02-2022 00:57 db7fc5e1-684d-5d92-a41b-25e40f37c0fe \n", + "1 21-02-2022 00:57 a2661c23-13b4-5823-959d-4324b9442056 \n", + "2 21-02-2022 00:57 0f2d6a35-7f63-57f8-8d20-0c8ab3141c74 \n", + "3 21-02-2022 00:57 f39db306-aca5-5c62-a75b-a9248de9566f \n", + "4 21-02-2022 00:57 27d2b3b2-7034-52b8-9b64-df5778853f44 \n", + ".. ... ... \n", + "669 21-02-2022 00:57 4fe5dd26-5fd1-5a2d-a401-d2c2791bc53b \n", + "670 21-02-2022 00:57 81e2bf7d-1e4d-5adc-8dea-e419e77d4565 \n", + "671 21-02-2022 00:57 6ad5677e-85b1-5c85-8dcc-93e8b612c97a \n", + "672 21-02-2022 00:57 e976ceae-4818-5456-9491-aaf38dc340ed \n", + "673 21-02-2022 00:57 bd1f5cd5-b465-55c3-b5b4-a08579e179af \n", + "\n", + "[674 rows x 20 columns]" + ], + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
ProductUrlproductTitleproductPriceaverageRatingreviewTitlereviewDescriptionreviewAuthorreviewAtreviewLikesreviewDislikescertifiedBuyerreviewerLocationfiveStarRatingCountfourStarRatingCountthreeStarRatingCounttwoStarRatingCountoneStarRatingCountreviewImagesscrapedAtuniqId
0https://www.flipkart.com/samsung-galaxy-nxt-go...SAMSUNG Galaxy On Nxt (Gold, 16 GB)₹9,4994.3Just wow!unbelievableKOUSIK DUTTAAug, 201800TrueBurdwan2,20,14783,93630,02610,26721,199NaN21-02-2022 00:57db7fc5e1-684d-5d92-a41b-25e40f37c0fe
1https://www.flipkart.com/samsung-galaxy-nxt-go...SAMSUNG Galaxy On Nxt (Gold, 16 GB)₹9,4994.3Awesomegood mobileFlipkart CustomerAug, 201800TrueKurnool2,20,14783,93630,02610,26721,199NaN21-02-2022 00:57a2661c23-13b4-5823-959d-4324b9442056
2https://www.flipkart.com/samsung-galaxy-nxt-go...SAMSUNG Galaxy On Nxt (Gold, 16 GB)₹9,4994.3Does the jobgoodRakesh RanjanAug, 201800TrueNoida2,20,14783,93630,02610,26721,199NaN21-02-2022 00:570f2d6a35-7f63-57f8-8d20-0c8ab3141c74
3https://www.flipkart.com/samsung-galaxy-nxt-go...SAMSUNG Galaxy On Nxt (Gold, 16 GB)₹9,4994.3Goodit's goodPabiT GoudaAug, 201800TrueBehror2,20,14783,93630,02610,26721,199NaN21-02-2022 00:57f39db306-aca5-5c62-a75b-a9248de9566f
4https://www.flipkart.com/samsung-galaxy-nxt-go...SAMSUNG Galaxy On Nxt (Gold, 16 GB)₹9,4994.3Wonderfulvery niceSujal PatelAug, 201800TrueDharampur2,20,14783,93630,02610,26721,199NaN21-02-2022 00:5727d2b3b2-7034-52b8-9b64-df5778853f44
...............................................................
669https://www.flipkart.com/apple-iphone-12-blue-...APPLE iPhone 12 (Blue, 128 GB)₹64,9994.7Highly recommendedamazing experience moving from android to iossidharth gurjar3 months ago00TrueRaja Sansi1,29,34420,8954,5881,6375,381NaN21-02-2022 00:574fe5dd26-5fd1-5a2d-a401-d2c2791bc53b
670https://www.flipkart.com/zebronics-wireless-to...ZEBRONICS Wireless Totem 3 Wireless Optical Mouse₹3743.7AwesomeThe product is so cheap and it is working prop...Hyma GumpuJan, 201500TrueVishakhapatnam705397249136214NaN21-02-2022 00:5781e2bf7d-1e4d-5adc-8dea-e419e77d4565
671https://www.flipkart.com/apple-iphone-12-blue-...APPLE iPhone 12 (Blue, 128 GB)₹64,9994.7Pretty goodMind blowing cameraVikas Kumar3 months ago00TrueSamastipur District1,29,34420,8954,5881,6375,381NaN21-02-2022 00:576ad5677e-85b1-5c85-8dcc-93e8b612c97a
672https://www.flipkart.com/zebronics-wireless-to...ZEBRONICS Wireless Totem 3 Wireless Optical Mouse₹3743.7NaNgot a defected moues at first ,flipkart replac...viresh guptaJan, 201500TrueGhaziabad705397249136214NaN21-02-2022 00:57e976ceae-4818-5456-9491-aaf38dc340ed
673https://www.flipkart.com/mmshopy-heavy-duty-ad...MMShopy Heavy Duty Adjustable Smartphone Phone...₹2194.1Best in the market!Excellent qualityIndrala Lakshmi Narayana14 days ago00TrueMetpally3,4731,778877350497https://rukminim1.flixcart.com/blobio/124/124/...21-02-2022 00:57bd1f5cd5-b465-55c3-b5b4-a08579e179af
\n", + "

674 rows × 20 columns

\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ] + }, + "metadata": {}, + "execution_count": 8 + } + ] + }, + { + "cell_type": "code", + "source": [ + "df.columns" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "mIvnrn1hV-Qh", + "outputId": "7b068032-e18e-4d98-8e3b-d90605657e25" + }, + "execution_count": 9, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "Index(['ProductUrl', 'productTitle', 'productPrice', 'averageRating',\n", + " 'reviewTitle', 'reviewDescription', 'reviewAuthor', 'reviewAt',\n", + " 'reviewLikes', 'reviewDislikes', 'certifiedBuyer', 'reviewerLocation',\n", + " 'fiveStarRatingCount', 'fourStarRatingCount', 'threeStarRatingCount',\n", + " 'twoStarRatingCount', 'oneStarRatingCount', 'reviewImages', 'scrapedAt',\n", + " 'uniqId'],\n", + " dtype='object')" + ] + }, + "metadata": {}, + "execution_count": 9 + } + ] + }, + { + "cell_type": "code", + "source": [ + "df.describe()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 300 + }, + "id": "2VeZNgeZWO0e", + "outputId": "9c85107d-7234-4f87-88d6-2e29ab110585" + }, + "execution_count": 10, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + " averageRating reviewLikes reviewDislikes\n", + "count 674.000000 674.000000 674.000000\n", + "mean 4.259347 0.670623 0.290801\n", + "std 0.222995 5.236584 3.097476\n", + "min 3.600000 0.000000 0.000000\n", + "25% 4.100000 0.000000 0.000000\n", + "50% 4.300000 0.000000 0.000000\n", + "75% 4.400000 0.000000 0.000000\n", + "max 4.700000 72.000000 64.000000" + ], + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
averageRatingreviewLikesreviewDislikes
count674.000000674.000000674.000000
mean4.2593470.6706230.290801
std0.2229955.2365843.097476
min3.6000000.0000000.000000
25%4.1000000.0000000.000000
50%4.3000000.0000000.000000
75%4.4000000.0000000.000000
max4.70000072.00000064.000000
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ] + }, + "metadata": {}, + "execution_count": 10 + } + ] + }, + { + "cell_type": "code", + "source": [ + "df.dtypes" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "LQXjnoufWUFO", + "outputId": "2efa2696-42ae-4147-e048-300502528f00" + }, + "execution_count": 15, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "ProductUrl object\n", + "productTitle object\n", + "productPrice object\n", + "averageRating float64\n", + "reviewTitle object\n", + "reviewDescription object\n", + "reviewAuthor object\n", + "reviewAt object\n", + "reviewLikes int64\n", + "reviewDislikes int64\n", + "certifiedBuyer bool\n", + "reviewerLocation object\n", + "fiveStarRatingCount object\n", + "fourStarRatingCount object\n", + "threeStarRatingCount object\n", + "twoStarRatingCount object\n", + "oneStarRatingCount object\n", + "reviewImages object\n", + "scrapedAt object\n", + "uniqId object\n", + "dtype: object" + ] + }, + "metadata": {}, + "execution_count": 15 + } + ] + }, + { + "cell_type": "code", + "source": [], + "metadata": { + "id": "JFWAOFqJWdVi" + }, + "execution_count": null, + "outputs": [] + } + ] +} \ No newline at end of file