From d9a4c4212c19266ce5d8f0794d5e51701e6817cf Mon Sep 17 00:00:00 2001 From: Parth Sharma <56518722+ParthSharmaT@users.noreply.github.com> Date: Tue, 8 Mar 2022 09:24:36 +0530 Subject: [PATCH 1/2] Ml algo --- product_recommendation_system.ipynb | 1273 +++++++++++++++++++++++++++ 1 file changed, 1273 insertions(+) create mode 100644 product_recommendation_system.ipynb diff --git a/product_recommendation_system.ipynb b/product_recommendation_system.ipynb new file mode 100644 index 0000000..019dc19 --- /dev/null +++ b/product_recommendation_system.ipynb @@ -0,0 +1,1273 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": { + "id": "uVyxXyhMRQvd" + }, + "source": [ + "### Amar Shaw\n", + "* Computer Science Engineering,(August, 2019)" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "j12wnJZ9RQvs" + }, + "source": [ + "## Product Recommendation System for e-commerce businesses\n", + "A well-developed recommendation system will help businesses improve their shoppers' experience on the website and result in better customer acquisition and retention.\n", + "\n", + "The recommendation system I have designed below is based on the journey of a new customer from the time he/she lands on the business’s website for the first time to when he/she makes repeat purchases.\n", + "\n", + "The recommendation system is designed in 2 parts based on the business context:\n", + "\n", + "* **Recommendation system part I:** Product popularity-based system targeted at new customers\n", + "\n", + "* **Recommendation system part II:** Model-based collaborative filtering system based on the customer's purchase history and ratings provided by other users who bought similar items\n", + "\n", + "When a new customer without any previous purchase history visits the e-commerce website for the first time, he/she is recommended the most popular products sold on the company's website. 
Once he/she makes a purchase, the recommendation system updates and recommends other products based on the purchase history and ratings provided by other users on the website. The latter part is done using collaborative filtering techniques." + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "TIv92NNXRQvy" + }, + "source": [ + "## Recommendation System - Part I\n", + "### Product popularity based recommendation system targeted at new customers\n", + "* Popularity-based recommendations are a great strategy to target new customers with the most popular products sold on a business's website and are very useful for cold-starting a recommendation engine.\n", + "\n", + "* **Dataset:** [Amazon product review dataset](https://www.kaggle.com/skillsmuggler/amazon-ratings)" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "e30EFFPSRQv1" + }, + "source": [ + "#### Importing libraries" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "en_1BcMoRQv2" + }, + "outputs": [], + "source": [ + "import numpy as np\n", + "import pandas as pd\n", + "import matplotlib.pyplot as plt\n", + "\n", + "# %matplotlib inline\n", + "plt.style.use(\"ggplot\")\n", + "\n", + "import sklearn\n", + "from sklearn.decomposition import TruncatedSVD" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "wK9fODZ5RQv7" + }, + "source": [ + "#### Loading the dataset" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "vPx8TmVZRQv9", + "outputId": "12195e81-9786-4015-d764-9fd97b7ab60c" + }, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
UserIdProductIdRatingTimestamp
0A39HTATAQ9V7YF02056164615.01369699200
1A3JM6GV9MNOF9X05589252783.01355443200
2A1Z513UWSAAO0F05589252785.01404691200
3A1WMRR494NWEWV07330019984.01382572800
4A3IAAVS479H7M707371044731.01274227200
\n", + "
" + ], + "text/plain": [ + " UserId ProductId Rating Timestamp\n", + "0 A39HTATAQ9V7YF 0205616461 5.0 1369699200\n", + "1 A3JM6GV9MNOF9X 0558925278 3.0 1355443200\n", + "2 A1Z513UWSAAO0F 0558925278 5.0 1404691200\n", + "3 A1WMRR494NWEWV 0733001998 4.0 1382572800\n", + "4 A3IAAVS479H7M7 0737104473 1.0 1274227200" + ] + }, + "execution_count": 2, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "amazon_ratings = pd.read_csv('../input/amazon-ratings/ratings_Beauty.csv')\n", + "amazon_ratings = amazon_ratings.dropna()\n", + "amazon_ratings.head()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "jV-HvLqyRQwC", + "outputId": "3d206407-0ddb-49b4-8cbb-f81b6337aff4" + }, + "outputs": [ + { + "data": { + "text/plain": [ + "(2023070, 4)" + ] + }, + "execution_count": 3, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "amazon_ratings.shape" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "4l-_ugFmRQwE", + "outputId": "d9692d4b-982b-40dc-a66d-dd28f2a6817f" + }, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Rating
ProductId
B001MA0QY27533
B0009V1YR82869
B0043OYFKU2477
B0000YUXI02143
B003V265QW2088
B000ZMBSPE2041
B003BQ6QXK1918
B004OHQR1Q1885
B00121UVU01838
B000FS05VG1589
\n", + "
" + ], + "text/plain": [ + " Rating\n", + "ProductId \n", + "B001MA0QY2 7533\n", + "B0009V1YR8 2869\n", + "B0043OYFKU 2477\n", + "B0000YUXI0 2143\n", + "B003V265QW 2088\n", + "B000ZMBSPE 2041\n", + "B003BQ6QXK 1918\n", + "B004OHQR1Q 1885\n", + "B00121UVU0 1838\n", + "B000FS05VG 1589" + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "popular_products = pd.DataFrame(amazon_ratings.groupby('ProductId')['Rating'].count())\n", + "most_popular = popular_products.sort_values('Rating', ascending=False)\n", + "most_popular.head(10)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "L4H53re1RQwG", + "outputId": "71626e84-88fd-431e-ec17-6f25f56a660e" + }, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "most_popular.head(30).plot(kind = \"bar\")" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "McqPBgQjRQwI" + }, + "source": [ + "** Analysis:**\n", + "\n", + "* The above graph gives us the most popular products (arranged in descending order) sold by the business.\n", + "\n", + "* For eaxmple, product, ID # B001MA0QY2 has sales of over 7000, the next most popular product, ID # B0009V1YR8 has sales of 3000, etc. " + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "kvOxcdF7RQwJ" + }, + "source": [ + "## Recommendation System - Part II\n", + "### Model-based collaborative filtering system\n", + "\n", + "* Recommend items to users based on purchase history and similarity of ratings provided by other users who bought items to that of a particular customer.\n", + "* A model based collaborative filtering technique is closen here as it helps in making predictinfg products for a particular user by identifying patterns based on preferences from multiple user data." + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "gzfXKSmaRQwK" + }, + "source": [ + "#### Utility Matrix based on products sold and user reviews\n", + "**Utility Matrix : **An utlity matrix is consists of all possible user-item preferences (ratings) details represented as a matrix. The utility matrix is sparce as none of the users would buy all teh items in the list, hence, most of the values are unknown." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "ibmBXWG-RQwL" + }, + "outputs": [], + "source": [ + "# Subset of Amazon Ratings\n", + "\n", + "amazon_ratings1 = amazon_ratings.head(10000)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "F_5-SZpiRQwN", + "outputId": "3c4253d3-964e-4e9d-a804-1d8e28396ba9" + }, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
ProductId0205616461055892527807330019980737104473076245145913041392121304139220130414089X130414643X1304146537...B000052YPEB000052YPFB000052YPGB000052YPHB000052YPMB000052YPUB000052YPVB000052YPYB000052YQ0B000052YQ2
UserId
A00205921JHJK5X9LNP420000000000...0000000000
A024581134CV80ZBLIZTZ0000000000...0000000000
A03056581JJIOL5FSKJY70000000000...0000000000
A03099101ZRK4K607JVHH0000000000...0000000000
A0505229A7NSH3FRXRR40000000000...0000000000
\n", + "

5 rows × 886 columns

\n", + "
" + ], + "text/plain": [ + "ProductId 0205616461 0558925278 0733001998 0737104473 \\\n", + "UserId \n", + "A00205921JHJK5X9LNP42 0 0 0 0 \n", + "A024581134CV80ZBLIZTZ 0 0 0 0 \n", + "A03056581JJIOL5FSKJY7 0 0 0 0 \n", + "A03099101ZRK4K607JVHH 0 0 0 0 \n", + "A0505229A7NSH3FRXRR4 0 0 0 0 \n", + "\n", + "ProductId 0762451459 1304139212 1304139220 130414089X \\\n", + "UserId \n", + "A00205921JHJK5X9LNP42 0 0 0 0 \n", + "A024581134CV80ZBLIZTZ 0 0 0 0 \n", + "A03056581JJIOL5FSKJY7 0 0 0 0 \n", + "A03099101ZRK4K607JVHH 0 0 0 0 \n", + "A0505229A7NSH3FRXRR4 0 0 0 0 \n", + "\n", + "ProductId 130414643X 1304146537 ... B000052YPE B000052YPF \\\n", + "UserId ... \n", + "A00205921JHJK5X9LNP42 0 0 ... 0 0 \n", + "A024581134CV80ZBLIZTZ 0 0 ... 0 0 \n", + "A03056581JJIOL5FSKJY7 0 0 ... 0 0 \n", + "A03099101ZRK4K607JVHH 0 0 ... 0 0 \n", + "A0505229A7NSH3FRXRR4 0 0 ... 0 0 \n", + "\n", + "ProductId B000052YPG B000052YPH B000052YPM B000052YPU \\\n", + "UserId \n", + "A00205921JHJK5X9LNP42 0 0 0 0 \n", + "A024581134CV80ZBLIZTZ 0 0 0 0 \n", + "A03056581JJIOL5FSKJY7 0 0 0 0 \n", + "A03099101ZRK4K607JVHH 0 0 0 0 \n", + "A0505229A7NSH3FRXRR4 0 0 0 0 \n", + "\n", + "ProductId B000052YPV B000052YPY B000052YQ0 B000052YQ2 \n", + "UserId \n", + "A00205921JHJK5X9LNP42 0 0 0 0 \n", + "A024581134CV80ZBLIZTZ 0 0 0 0 \n", + "A03056581JJIOL5FSKJY7 0 0 0 0 \n", + "A03099101ZRK4K607JVHH 0 0 0 0 \n", + "A0505229A7NSH3FRXRR4 0 0 0 0 \n", + "\n", + "[5 rows x 886 columns]" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "ratings_utility_matrix = amazon_ratings1.pivot_table(values='Rating', index='UserId', columns='ProductId', fill_value=0)\n", + "ratings_utility_matrix.head()" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "-WFAJjA9RQwO" + }, + "source": [ + "As expected, the utility matrix obtained above is sparse; I have filled in the unknown values with 0." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "e-FK4QPiRQwP", + "outputId": "ba4cdf8b-70fc-4657-caa4-3e819f654f41" + }, + "outputs": [ + { + "data": { + "text/plain": [ + "(9697, 886)" + ] + }, + "execution_count": 8, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "ratings_utility_matrix.shape" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "ReF4Jv8YRQwQ" + }, + "source": [ + "Transposing the matrix" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "1OTKO8PURQwR", + "outputId": "cb8d2480-2b17-43ac-eb01-9da2b2670159" + }, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
UserIdA00205921JHJK5X9LNP42A024581134CV80ZBLIZTZA03056581JJIOL5FSKJY7A03099101ZRK4K607JVHHA0505229A7NSH3FRXRR4A05492663T95KW63BR75KA059547920Q3LZVFHLPI3A07410232KYRFR25CIUGJA082796624UNM47DSAI6KA0864963DOAY7LXGS5I6...AZW1HXXYAC15BAZWRTJPN7NXTAZWTXHXZXFAYPAZYQEFB9Y5N22AZZHB6U54UDYWAZZHJZP4GQPPZAZZNK89PXD006AZZOFVMQC0BJGAZZQXL8VDCFTVAZZTJQ7CQZUD8
ProductId
02056164610000000000...0000000000
05589252780000000000...0000000000
07330019980000000000...0000000000
07371044730000000000...0000000000
07624514590000000000...0000000000
\n", + "

5 rows × 9697 columns

\n", + "
" + ], + "text/plain": [ + "UserId A00205921JHJK5X9LNP42 A024581134CV80ZBLIZTZ \\\n", + "ProductId \n", + "0205616461 0 0 \n", + "0558925278 0 0 \n", + "0733001998 0 0 \n", + "0737104473 0 0 \n", + "0762451459 0 0 \n", + "\n", + "UserId A03056581JJIOL5FSKJY7 A03099101ZRK4K607JVHH \\\n", + "ProductId \n", + "0205616461 0 0 \n", + "0558925278 0 0 \n", + "0733001998 0 0 \n", + "0737104473 0 0 \n", + "0762451459 0 0 \n", + "\n", + "UserId A0505229A7NSH3FRXRR4 A05492663T95KW63BR75K \\\n", + "ProductId \n", + "0205616461 0 0 \n", + "0558925278 0 0 \n", + "0733001998 0 0 \n", + "0737104473 0 0 \n", + "0762451459 0 0 \n", + "\n", + "UserId A059547920Q3LZVFHLPI3 A07410232KYRFR25CIUGJ \\\n", + "ProductId \n", + "0205616461 0 0 \n", + "0558925278 0 0 \n", + "0733001998 0 0 \n", + "0737104473 0 0 \n", + "0762451459 0 0 \n", + "\n", + "UserId A082796624UNM47DSAI6K A0864963DOAY7LXGS5I6 ... AZW1HXXYAC15B \\\n", + "ProductId ... \n", + "0205616461 0 0 ... 0 \n", + "0558925278 0 0 ... 0 \n", + "0733001998 0 0 ... 0 \n", + "0737104473 0 0 ... 0 \n", + "0762451459 0 0 ... 
0 \n", + "\n", + "UserId AZWRTJPN7NXT AZWTXHXZXFAYP AZYQEFB9Y5N22 AZZHB6U54UDYW \\\n", + "ProductId \n", + "0205616461 0 0 0 0 \n", + "0558925278 0 0 0 0 \n", + "0733001998 0 0 0 0 \n", + "0737104473 0 0 0 0 \n", + "0762451459 0 0 0 0 \n", + "\n", + "UserId AZZHJZP4GQPPZ AZZNK89PXD006 AZZOFVMQC0BJG AZZQXL8VDCFTV \\\n", + "ProductId \n", + "0205616461 0 0 0 0 \n", + "0558925278 0 0 0 0 \n", + "0733001998 0 0 0 0 \n", + "0737104473 0 0 0 0 \n", + "0762451459 0 0 0 0 \n", + "\n", + "UserId AZZTJQ7CQZUD8 \n", + "ProductId \n", + "0205616461 0 \n", + "0558925278 0 \n", + "0733001998 0 \n", + "0737104473 0 \n", + "0762451459 0 \n", + "\n", + "[5 rows x 9697 columns]" + ] + }, + "execution_count": 9, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "X = ratings_utility_matrix.T\n", + "X.head()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "Oi8aiLZnRQwS", + "outputId": "f73c7e22-fe61-487d-86ef-0c6dfd4efdd4" + }, + "outputs": [ + { + "data": { + "text/plain": [ + "(886, 9697)" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "X.shape" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "6ZuWY0roRQwT" + }, + "source": [ + "Unique products in subset of data" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "80cPGLhERQwU" + }, + "outputs": [], + "source": [ + "X1 = X" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "NwPaVyP8RQwV" + }, + "source": [ + "### Decomposing the Matrix" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "QHHmjYQXRQwV", + "outputId": "33051977-14c1-4f53-f1d3-cad62aa54e54" + }, + "outputs": [ + { + "data": { + "text/plain": [ + "(886, 10)" + ] + }, + "execution_count": 12, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "SVD = TruncatedSVD(n_components=10)\n", + "decomposed_matrix = 
SVD.fit_transform(X)\n", + "decomposed_matrix.shape" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "9kQz_tcmRQwX" + }, + "source": [ + "### Correlation Matrix" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "GZmekSFzRQwX", + "outputId": "c4a9fd5e-4f2d-4180-a0f4-2d70c5b44f79" + }, + "outputs": [ + { + "data": { + "text/plain": [ + "(886, 886)" + ] + }, + "execution_count": 13, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "correlation_matrix = np.corrcoef(decomposed_matrix)\n", + "correlation_matrix.shape" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "QVyqnlnVRQwY" + }, + "source": [ + "correlation_matrix" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "_4tCGms0RQwZ" + }, + "source": [ + "### Isolating Product ID # 6117036094 from the Correlation Matrix\n", + "\n", + "Assuming the customer buys Product ID # 6117036094 (randomly chosen)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "scrolled": true, + "id": "86-tm5xqRQwZ", + "outputId": "38e66f5a-99c4-4f7c-eb5b-ddd8653d0bf8" + }, + "outputs": [ + { + "data": { + "text/plain": [ + "'6117036094'" + ] + }, + "execution_count": 14, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "X.index[99]" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "xJWcpIt1RQwa" + }, + "source": [ + "Index # of product ID purchased by customer" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "B8nK5ri2RQwa", + "outputId": "68860da5-cdad-4444-c120-5f66ffd786c1" + }, + "outputs": [ + { + "data": { + "text/plain": [ + "99" + ] + }, + "execution_count": 15, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "i = \"6117036094\"\n", + "\n", + "product_names = list(X.index)\n", + "product_ID = product_names.index(i)\n", + "product_ID" + ] + }, + { + "cell_type": "markdown", + "metadata": 
{ + "id": "bG4yDqdLRQwb" + }, + "source": [ + "Correlation of all items with the item purchased by this customer, based on items rated by other customers who bought the same product" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "fkfxflgaRQwc", + "outputId": "89576824-71c5-4ecb-d664-144c0b080524" + }, + "outputs": [ + { + "data": { + "text/plain": [ + "(886,)" + ] + }, + "execution_count": 16, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "correlation_product_ID = correlation_matrix[product_ID]\n", + "correlation_product_ID.shape" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "HdJGseMxRQwd" + }, + "source": [ + "### Recommending the top highly correlated products in sequence" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "gUmGy1lrRQwd", + "outputId": "29e601e8-94b5-4d1c-f9a5-2b27524efcff" + }, + "outputs": [ + { + "data": { + "text/plain": [ + "['0733001998',\n", + " '1304139212',\n", + " '1304139220',\n", + " '130414089X',\n", + " '130414643X',\n", + " '130414674X',\n", + " '1304174778',\n", + " '1304174867',\n", + " '1304174905']" + ] + }, + "execution_count": 17, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "Recommend = list(X.index[correlation_product_ID > 0.90])\n", + "\n", + "# Removes the item already bought by the customer\n", + "Recommend.remove(i) \n", + "\n", + "Recommend[0:9]" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "yx0g7kbmRQwe" + }, + "source": [ + "**Product Id # 6117036094**\n", + "Here are the top products (the first 9 with a correlation above 0.90, as returned by the cell above) to be displayed by the recommendation system to the above customer based on the purchase history of other customers on the website. 
" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.6.6" + }, + "colab": { + "name": "product-recommendation-system.ipynb", + "provenance": [] + } + }, + "nbformat": 4, + "nbformat_minor": 0 +} \ No newline at end of file From 1ed30ed0da3959213858091c2f443fa7be591254 Mon Sep 17 00:00:00 2001 From: Parth Sharma <56518722+ParthSharmaT@users.noreply.github.com> Date: Tue, 8 Mar 2022 11:19:54 +0530 Subject: [PATCH 2/2] Ml model --- product_recommendation_system.ipynb | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/product_recommendation_system.ipynb b/product_recommendation_system.ipynb index 019dc19..5b148e6 100644 --- a/product_recommendation_system.ipynb +++ b/product_recommendation_system.ipynb @@ -6,8 +6,8 @@ "id": "uVyxXyhMRQvd" }, "source": [ - "### Amar Shaw\n", - "* Computer Science Engineering,(August, 2019)" + "### Parth Sharma\n", + "* Computer Science and Engineering,(March, 2022)" ] }, { @@ -1270,4 +1270,4 @@ }, "nbformat": 4, "nbformat_minor": 0 -} \ No newline at end of file +}