From 6131d4c2c76d75f1f0abcf50907c0d27c473202c Mon Sep 17 00:00:00 2001 From: gk552 <104007378+gk552@users.noreply.github.com> Date: Sat, 4 Jun 2022 00:38:03 +0530 Subject: [PATCH] Add files via upload --- Anaconda.md | 47 +++ Jupyter Notebook.ipynb | 84 +++++ Metplotlib.ipynb | 219 +++++++++++ Numpy Notebook.ipynb | 544 +++++++++++++++++++++++++++ Pandas Notebook.ipynb | 826 +++++++++++++++++++++++++++++++++++++++++ 5 files changed, 1720 insertions(+) create mode 100644 Anaconda.md create mode 100644 Jupyter Notebook.ipynb create mode 100644 Metplotlib.ipynb create mode 100644 Numpy Notebook.ipynb create mode 100644 Pandas Notebook.ipynb diff --git a/Anaconda.md b/Anaconda.md new file mode 100644 index 0000000..7fc8fb1 --- /dev/null +++ b/Anaconda.md @@ -0,0 +1,47 @@ + +# Anaconda + +# What is Anaconda? +Anaconda is an open source handy toolkit for developers. It makes the job easy for the developers by enabling them to create specific Working Environments and work in them. + + + ## But What Is Working Environment? + Let's understand this with an easy example. Let's say you are designing a house. Every room has its Environment, and according to the nature of that Environment, we add different items to that room. For example, in the kitchen, we will install a sink and gas stove and additional shelves for utensils and vegetables; just like this, we will install different items in our bedroom and living room. +Now think of this as a developer. A developer is working on various projects simultaneously, and they'll need different packages for different projects. With the help of Anaconda, they can create different **Working Environments** with these different packages that they can access anytime. They'll not have to install these packages every time they switch from one project to another; instead, they switch from one Environment to the other, and they will easily have access to all these packages. 
+They can also modify these **Working Environments** by adding, removing, or updating any package anytime. + +--- + +# Installing Anaconda. + +* Search **Anaconda Install** in your Web Browser. +* Click on Anaconda Distribution link that appears. +* A download option appears on the right part of your screen. Click on download button and wait till it downloads. +* Click on the executable file which is downloaded and follow the simple steps that appear on screen. Just make sure about the following: + + While installing select Install for **Just Me** option. + + Select **Add Anaconda to my PATH environment variable**. ++ Now wait till it installs and then we can work with Anaconda Prompt. +--- +# Working in an Environment in Anaconda +## Creating an Environment +Open the Anaconda command prompt. You'll be directed to the base environment in Anaconda. +To set up a new Environment, type **"conda create --name NAME python=VERSION"** (without inverted commas) +Here, NAME is the name of the environment you want to create and VERSION specifies which version of Python you want to work with in this environment. +*for example:* ***conda create --name basisoflearning python=3.9*** will create an environment named 'basisoflearning' which will work with python 3.9 +### To enter the environment, +type ***conda activate basisoflearning*** and you'll enter basisoflearning environment. +### To install any package in the Environment, +we will have to give different commands to download different packages in Anaconda which are easily available on the web. +*for example :* to install NumPy we can give command ***conda install -c anaconda numpy***. This will install numpy in the environment. + +### To exit the environment, +type ***conda deactivate*** and you'll head out of that environment. + +--- + +## Other Important Commands Examples. + + +* ***conda list*** command fetches us list of all the packages installed in the environment. 
+* ***conda update numpy*** will update numpy library to its latest version. +* ***conda env list*** gives list of all the environments created on the system. \ No newline at end of file diff --git a/Jupyter Notebook.ipynb b/Jupyter Notebook.ipynb new file mode 100644 index 0000000..e8d2031 --- /dev/null +++ b/Jupyter Notebook.ipynb @@ -0,0 +1,84 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "5e222e60", + "metadata": {}, + "source": [ + "# How to Install Jupyter Notebook?\n", + "* open command prompt.\n", + "* type **pip install jupyter** \n", + "This will install Jupyter in the system." + ] + }, + { + "cell_type": "markdown", + "id": "780f90dd", + "metadata": {}, + "source": [ + "# Launching Jupyter Notebook\n", + "In command prompt type **jupyter notebook**. This will open jupyter notebook in the browser. \n", + "# Creating a Notebook\n", + "* Click on the New button (upper right).\n", + "* It will open up a list of choices. Choose the version of python you want to create the notebook in.\n", + "* It will open a new Jupyter Notebook in the browser.\n" + ] + }, + { + "cell_type": "markdown", + "id": "c442f20a", + "metadata": {}, + "source": [ + "# Cells \n", + "Cells in Jupyter Notebook are used to execute chunks of code by default, but we can change the cell type to Markdown or Raw NBConvert according to our need. These cells will execute only the code written in them on clicking on Run button in the taskbar or pressing **Shift + Enter**. *for example:*" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "e8c00aa2", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Basis Of Learning\n" + ] + } + ], + "source": [ + "print(\"Basis Of Learning\")" + ] + }, + { + "cell_type": "markdown", + "id": "a0683d7d", + "metadata": {}, + "source": [ + "These Cells get executed in a specific sequence which is usually mentioned in front of them. 
We can change the sequence in which they will be executed, add as many cells as required and delete cells." + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/Metplotlib.ipynb b/Metplotlib.ipynb new file mode 100644 index 0000000..9b1c872 --- /dev/null +++ b/Metplotlib.ipynb @@ -0,0 +1,219 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "3f6185f4", + "metadata": {}, + "source": [ + "# Matplotlib" + ] + }, + { + "cell_type": "markdown", + "id": "9cf85aeb", + "metadata": {}, + "source": [ + "Matplotlib is a data visualization library. It helps to create visual representation of data i.e. explain data through graphs, pie charts, scatters and histograms." + ] + }, + { + "cell_type": "markdown", + "id": "2c33ebd5", + "metadata": {}, + "source": [ + "### Visual Representation of data using Matplotlib." + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "ca7e3a0e", + "metadata": {}, + "outputs": [], + "source": [ + "%matplotlib inline #enable the inline plotting, where the plots/graphs will be displayed just below the cell where your plotting commands are written.\n", + "from matplotlib import pyplot as plt #pyplot from matplotlib is responsible to create graphs." + ] + }, + { + "cell_type": "markdown", + "id": "936f998d", + "metadata": {}, + "source": [ + "### Creating Plot using Matplotlib." + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "id": "f0985e66", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "x1 = [1,4,6,10] #specifying points required for plotting.\n", + "y1 = [3,7,11,15]\n", + "x2 = [2,6,10]\n", + "y2 = [15,8,2]\n", + "\n", + "# to create a plot, use .plot() command.\n", + "plt.plot(x1,y1) #plots the points on graph\n", + "plt.plot(x2,y2)\n", + "plt.show() #shows the graph." + ] + }, + { + "cell_type": "markdown", + "id": "c9fd4d7a", + "metadata": {}, + "source": [ + "We can also edit these graphs, add heading, label axis and label graphs in case there are more than one set of data is plotted on the same graph." + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "29e17ba3", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "#consider the same example.\n", + "plt.plot(x1,y1, label='First') \n", + "plt.plot(x2,y2, label= 'Second')\n", + "plt.title(\"DEMO GRAPH\") #Adds Title to the Plot\n", + "plt.ylabel('Y Axis') # labels y axis\n", + "plt.xlabel('X Axis') # labels x axis\n", + "plt.legend() #The labelling of individual plots wouldn't show up in graph unless we use this command\n", + "plt.show()" + ] + }, + { + "cell_type": "markdown", + "id": "49bb4d19", + "metadata": {}, + "source": [ + "Just like this we can plot other types of graphs also. They can be created using different commands which are easily available in the Matplotlib documentation online along with the type of arguments they take to plot the data." + ] + }, + { + "cell_type": "markdown", + "id": "e6e0c19b", + "metadata": {}, + "source": [ + "For example we can plot a scatter of the same data as follows:\n" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "f3ed11f1", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": 
"iVBORw0KGgoAAAANSUhEUgAAAXAAAAD4CAYAAAD1jb0+AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/YYfK9AAAACXBIWXMAAAsTAAALEwEAmpwYAAAOgUlEQVR4nO3df2jc933H8ddrkkrPWWul+NJVVpjTUbQN4+Fyf6QNdKNqUKD54T82k0CG1wX8z6izsimLVkhK/iqoLG0YdJg0TaDBxXia25SuinFXwiALyFZquXG0QJvaktz6QpA3uoMo7nt/3Mm2zpZ1d9+v9L2P9Xz8c7rPne/75kv8zNff+57OESEAQHp+p+gBAACdIeAAkCgCDgCJIuAAkCgCDgCJ6t3IjW3bti127NixkZsEgOSdOHHinYgoN69vaMB37NihqampjdwkACTP9i+vt84pFABIFAEHgEQRcABIFAEHgEQRcABI1IZehZK0U4el409JF+ekrYPS8BPSrr1FTwWgyx2dntf45KwWFmsa6C9pdGRIe3Zvz+W1CXgrTh2WXjogLdXq9y+eq9+XiDiAVR2dntfYxIxqS5ckSfOLNY1NzEhSLhHnFEorjj91Jd7Llmr1dQBYxfjk7OV4L6stXdL45Gwur0/AW3Fxrr11AJC0sFhra71dBLwVWwfbWwcASQP9pbbW20XAWzH8hNTXtMP7SvV1AFjF6MiQSn09K9ZKfT0aHRnK5fV5E7MVy29UchUKgDYsv1G5XleheCO/E7NSqQS/zAoA2mP7RERUmtc5hQIAiSLgAJAoAg4AiSLgAJAoAg4AiSLgAJAoAg4AiVoz4Lafs33B9unrPPb3tsP2tvUZDwCwmlaOwJ+XdE/zou3bJd0t6WzOMwEAWrBmwCPiFUnvXuehpyU9JmnjPsoJALiso3Pgtu+XNB8RP23hufttT9meqlarnWwOAHAdbQfc9hZJX5bU0q/ii4iDEVGJiEq5XG53cwCAVXRyBP4Hku6Q9FPbb0salHTS9u/lORgA4Mba/nWyETEj6bbl+42IVyLinRznAgCsoZXLCA9JelXSkO0524+s/1gAgLWseQQeEQ+t8fiO3KYBALSMT2ICQKIIOAAkioADQKIIOAAkioADQKIIOAAkioADQKIIOAAkioADQKIIOAAkioADQKIIOAAkioADQKIIOAAkioADQKIIOAAkioADQKIIOAAkioADQKIIOAAkioADQKIIOAAkas2A237O9gXbp69aG7f9pu1Ttv/Ndv+6TgkAuEYrR+DPS7qnae2YpJ0RsUvSf0say3kuAMAa1gx4RLwi6d2mtZcj4v3G3f+SNLgOswEAbiCPc+B/LenfV3vQ9n7bU7anqtVqDpsDAEgZA277y5Lel/Tias+JiIMRUYmISrlczrI5AMBVejv9g7b3SbpX0nBERH4jAQBa0VHAbd8j6R8k/WlE/F++IwEAWtHKZYSHJL0qacj2nO1HJP2zpA9JOmb7ddv/ss5zAgCarHkEHhEPXWf5W+swCwCgDXwSEwASRcABIFEEHAASRcABIFEEHAASRcABIFEdfxITQN3R6XmNT85qYbGmgf6SRkeGtGf39qLHwiZAwIEMjk7Pa2xiRrWlS5Kk+cWaxiZmJImIY91xCgXIYHxy9nK8l9WWLml8cragibCZEHAgg4XFWlvrQJ4IOJDBQH+prXUgTwQcyGB0ZEilvp4Va6W+Ho2ODBU0ETYT3sQEMlh+o5KrUFAEAg5ktGf3doKNQnAKBQASRcABIFEEHAASRcABIFEEHAASRcABIFEEHAAStWbAbT9n+4Lt01etfcT2MdtvNW5vXd8xAQDNWjkCf17SPU1rj0s6HhGfkHS8cR8AsIHWDHhEvCLp3ablByS90Pj5BUl78h0LALCWTs+BfzQizktS4/a21Z5oe7/tKdtT1Wq1w80BAJqt+5uYEXEwIioRUSmXy+u9OQDYNDoN+K9tf0ySGrcX8hsJANCKTgP
+fUn7Gj/vk/S9fMYBALSqlcsID0l6VdKQ7Tnbj0j6qqS7bb8l6e7GfQDABlrz94FHxEOrPDSc8ywAgDbwSUwASBQBB4BEEXAASBQBB4BEEXAASBQBB4BEEXAASBQBB4BEEXAASBQBB4BEEXAASBQBB4BEEXAASBQBB4BEEXAASBQBB4BEEXAASBQBB4BEEXAASBQBB4BEEXAASBQBB4BEZQq47S/Z/pnt07YP2f5gXoMByTh1WHp6p/SV/vrtqcNFT4RNouOA294u6YCkSkTslNQj6cG8BgOScOqw9NIB6eI5SVG/fekAEceGyHoKpVdSyXavpC2SFrKPBCTk+FPSUm3l2lKtvg6ss44DHhHzkr4m6ayk85IuRsTLzc+zvd/2lO2parXa+aRAN7o41946kKMsp1BulfSApDskDUi6xfbDzc+LiIMRUYmISrlc7nxSoBttHWxvHchRllMon5P0i4ioRsSSpAlJn85nLCARw09IfaWVa32l+jqwzrIE/KykO21vsW1Jw5LO5DMWkIhde6X7npG23i7J9dv7nqmvA+ust9M/GBGv2T4i6aSk9yVNSzqY12BAMnbtJdgoRMcBl6SIeFLSkznNAgBoA5/EBIBEEXAASBQBB4BEEXAASBQBB4BEEXAASFSmywixeR2dntf45KwWFmsa6C9pdGRIe3ZvL3osYFMh4Gjb0el5jU3MqLZ0SZI0v1jT2MSMJBFxYANxCgVtG5+cvRzvZbWlSxqfnC1oImBzIuBo28Jira11AOuDgKNtA/2lttYBrA8CjraNjgyp1NezYq3U16PRkaGCJgI2J97ERNuW36jkKhSgWAQcHdmzezvBBgrGKRQASBQBB4BEEXAASBQBB4BEEXAASBQBB4BEEXAASFSmgNvut33E9pu2z9j+VF6DAQBuLOsHeb4h6UcR8ee2PyBpSw4zAQBa0HHAbX9Y0mck/ZUkRcR7kt7LZywAwFqynEL5uKSqpG/bnrb9rO1bmp9ke7/tKdtT1Wo1w+YAAFfLEvBeSZ+U9M2I2C3pN5Ieb35SRByMiEpEVMrlcobNAQCuliXgc5LmIuK1xv0jqgcdALABOg54RPxK0jnby78EeljSG7lMBQBYU9arUL4o6cXGFSg/l/SF7CMBAFqRKeAR8bqkSj6jAADawScxASBRBBwAEkXAASBRBBwAEkXAASBRBBwAEkXAASBRBBwAEkXAASBRBBwAEkXAASBRBBwAEkXAASBRBBwAEkXAASBRBBwAEkXAASBRBBwAEkXAASBRBBwAEkXAASBRmQNuu8f2tO0f5DEQAKA1eRyBPyrpTA6vAwBoQ6aA2x6U9HlJz+YzDgCgVVmPwL8u6TFJv80+CgCgHR0H3Pa9ki5ExIk1nrff9pTtqWq12unmAABNshyB3yXpfttvS/qupM/a/k7zkyLiYERUIqJSLpczbA4AcLWOAx4RYxExGBE7JD0o6ccR8XBukwEAbojrwAEgUb15vEhE/ETST/J4LQBAazgCB4BEEXAASBQBB4BEEXAASBQBB4BEEXAASBQBB4BE5XId+Ho6Oj2v8clZLSzWNNBf0ujIkPbs3l70WABQuK4O+NHpeY1NzKi2dEmSNL9Y09jEjCQRcQCbXlefQhmfnL0c72W1pUsan5wtaCIA6B5dHfCFxVpb6wCwmXR1wAf6S22tA8Bm0tUBHx0ZUqmvZ8Vaqa9HoyNDBU0EAN2jq9/EXH6jkqtQAOBaXR1wqR5xgg0A1+rqUygAgNURcABIFAEHgEQRcABIFAEHgEQRcABIFAEHgER1HHDbt9v+D9tnbP/M9qN5DgYAN4VTh6Wnd0pf6a/fnjqc20tn+SDP+5L+LiJO2v6QpBO2j0XEGznNBgBpO3VYeumAtNT4BXwXz9XvS9KuvZlfvuMj8Ig4HxEnGz//r6QzkvjIJAAsO/7UlXgvW6rV13OQyzlw2zsk7Zb02nUe2297yvZUtVrNY3MAkIaLc+2ttylzwG3/rqR/lfS
3EfE/zY9HxMGIqEREpVwuZ90cAKRj62B7623KFHDbfarH+8WImMhlIgC4WQw/IfU1fX9BX6m+noMsV6FY0rcknYmIf8plGgC4mezaK933jLT1dkmu3973TC5vYErZrkK5S9JfSpqx/Xpj7R8j4oeZpwKAm8WuvbkFu1nHAY+I/5TkHGcBALSBT2ICQKIIOAAkioADQKIIOAAkyhGxcRuzq5J+uWEbXB/bJL1T9BBdhP1xBftiJfbHSln2x+9HxDWfhNzQgN8MbE9FRKXoOboF++MK9sVK7I+V1mN/cAoFABJFwAEgUQS8fQeLHqDLsD+uYF+sxP5YKff9wTlwAEgUR+AAkCgCDgCJIuAt4kucr2W7x/a07R8UPUvRbPfbPmL7zcZ/I58qeqai2P5S4+/IaduHbH+w6Jk2ku3nbF+wffqqtY/YPmb7rcbtrXlsi4C3bvlLnP9I0p2S/sb2Hxc8U9EeVf27UCF9Q9KPIuIPJf2JNul+sb1d0gFJlYjYKalH0oPFTrXhnpd0T9Pa45KOR8QnJB1v3M+MgLeIL3FeyfagpM9LerboWYpm+8OSPqP6F5woIt6LiMVChypWr6SS7V5JWyQtFDzPhoqIVyS927T8gKQXGj+/IGlPHtsi4B240Zc4byJfl/SYpN8WPEc3+LikqqRvN04pPWv7lqKHKkJEzEv6mqSzks5LuhgRLxc7VVf4aEScl+oHg5Juy+NFCXib1voS583A9r2SLkTEiaJn6RK9kj4p6ZsRsVvSb5TTP5FT0zi3+4CkOyQNSLrF9sPFTnXzIuBt4EucL7tL0v2235b0XUmftf2dYkcq1JykuYhY/hfZEdWDvhl9TtIvIqIaEUuSJiR9uuCZusGvbX9Mkhq3F/J4UQLeIr7E+YqIGIuIwYjYofobVD+OiE17lBURv5J0zvZQY2lY0hsFjlSks5LutL2l8XdmWJv0Dd0m35e0r/HzPknfy+NFs3yp8WbDlzjjRr4o6UXbH5D0c0lfKHieQkTEa7aPSDqp+pVb09pkH6m3fUjSn0naZntO0pOSvirpsO1HVP+f3F/ksi0+Sg8AaeIUCgAkioADQKIIOAAkioADQKIIOAAkioADQKIIOAAk6v8BE0uvwlE7yRkAAAAASUVORK5CYII=\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "plt.scatter(x1,y1)\n", + "plt.scatter(x2,y2)\n", + "plt.show()" + ] + }, + { + "cell_type": "markdown", + "id": "7e839813", + "metadata": {}, + "source": [ + "Similarly we can change the styles of plots using **style** from metplotlib library. Different types of styes and their commands are available in metplotlib library." + ] + }, + { + "cell_type": "markdown", + "id": "eaadfca8", + "metadata": {}, + "source": [ + "*for example:*we can change style of the graph using **ggplot** as follows" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "id": "f51ca17c", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXAAAAD4CAYAAAD1jb0+AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/YYfK9AAAACXBIWXMAAAsTAAALEwEAmpwYAAASR0lEQVR4nO3dX2hT5x/H8U9szKZmrW1PXRb/IN0qw6EdY07ZcBYNY4yJXpWtdSBDhlYQa3GKGw71YmWstggtCgMdo7vwQtspepPJ9MKb2jLp1KlsKkLJ1tg6G62tMfld6K9dtLVNctLTZ32/7vI0yfnmS/349MlzznHF4/G4AADGmeR0AQCA1BDgAGAoAhwADEWAA4ChCHAAMBQBDgCGco/1ATs6Osb6kLayLEvhcNjpMsYN+jGIXiSiH4nS6Yff7x9ynBk4ABiKAAcAQxHgAGAoAhwADEWAA4ChxnwXiqlCkX41ng8rEu2Q1y2VF1vyeT1OlwVgnIt1hqTmRnXd7VFs2gvSqnJNKvDZ8t4E+CiEIv366uebCkUeDIxdCfdq14rZhDiAYcU6Q4rX7pQ6QxpIjz8vK1a525YQZwllFBrPhxPCW5JCkQdqPM8eVwDP0NwodYYSxx7PyO1AgI9C970HQ4/3Dj0OAJIUv92V1HiyCPBRyJ06eejxKUOPA4AkuabnJTWeLAJ8FB59YZkY1j7vZJUXWw5VBMAIq8qlJ9e6C3yPxm3Al5ij4PN6tGvF7Me7UFzyuuPsQgEwokkFPsUqd0vNjXLf7VGUXSjO8Hk9qnrHzwV6ACRlUoFPWlelvAxkB0soAGAoAhwADEWAA4ChCHAAMBQBDgCGIsABwFAEOAAYasQAb2ho0Lp161RVVfXUz3766SeVlpbqzp07GSkOADC8EQO8pKREO3bseGo8HA6rvb1dlsXp5ADghBEDfP78+fJ6vU+Nf//99yovL5fL5cpIYQCAZ0vpVPpz584pLy9Pc+fOHfG5wWBQwWBQklRdXW38jN3tdhv/GexEPwbRi0T0I1Em+pF0gPf19enIkSP68ssvR/X8QCCgQCAw8Nj064hwLZRE9GMQvUhEPxKl0w+/3z/keNK7UP766y/9/fff2rp1qzZu3Khbt25p27Ztun37dkqFAQBSk/QMfM6cOfruu+8GHm/cuFFff/21srOzbS0MAPBsIwZ4XV2dLl68qJ6eHq1fv16lpaVavnz5WNQGAHiGEQN88+bNz/x5f
X29XbUAAJLAmZgAYCgCHAAMRYADgKEIcAAwFAEOAIYiwAHAUAQ4ABiKAAcAQxHgAGAoAhwADEWAA4ChCHAAMBQBDgCGIsABwFAEOAAYigAHAEMR4ABgKAIcAAxFgAOAoQhwADAUAQ4AhiLAAcBQ7pGe0NDQoLa2NuXk5KimpkaS9MMPP6i1tVVut1svvviiKioqNG3atIwXCwAYNOIMvKSkRDt27EgYW7hwoWpqavTtt9/qpZde0tGjRzNWIABgaCMG+Pz58+X1ehPGiouLlZWVJUmaN2+eurq6MlMdAGBYIy6hjOTUqVN6++23h/15MBhUMBiUJFVXV8uyrHQP6Si32238Z7AT/RhELxLRj0SZ6EdaAX7kyBFlZWVp6dKlwz4nEAgoEAgMPA6Hw+kc0nGWZRn/GexEPwbRi0T0I1E6/fD7/UOOp7wL5ZdfflFra6s2bdokl8uV6tsAAFKUUoD/+uuvam5u1rZt2/Tcc8/ZXRMAYBRGXEKpq6vTxYsX1dPTo/Xr16u0tFRHjx5VNBrVnj17JElFRUX67LPPMl4sAGDQiAG+efPmp8aWL1+eiVoAAEngTEwAMBQBDgCGIsABwFAEOAAYigAHAEMR4ABgqLSvhQJMdLHOkNTcqK67PYpNe0FaVa5JBT6ny8IEQIADaYh1hhSv3Sl1hvTg/4N/XlascjchjoxjCQVIR3Oj1BlKHHs8IwcyjQAH0hC/PfS18IcbB+xEgANpcE3PS2ocsBMBDqRjVbn05Fp3ge/ROJBhfIkJpGFSgU+xyt1Sc6Pcd3sUZRcKxhABDqRpUoFPWlelPO5AgzHGEgoAGIoABwBDEeAAYCgCHAAMRYADgKEIcAAwFAEOAIYacR94Q0OD2tralJOTo5qaGklSJBJRbW2tOjs7VVBQoMrKSnm93owXCwAYNOIMvKSkRDt27EgYa2pq0oIFC7Rv3z4tWLBATU1NmaoPADCMEQN8/vz5T82uW1patGzZMknSsmXL1NLSkpnqAADDSulU+n/++Ue5ubmSpNzcXN25c2fY5waDQQWDQUlSdXW1LMtK5ZDjhtvtNv4z2Il+DKIXiehHokz0I+PXQgkEAgoEAgOPTb9WhMX1LhLQj0H0IhH9SJROP/x+/5DjKe1CycnJUXd3tySpu7tb2dnZKRUFAEhdSgH+5ptv6vTp05Kk06dPa9GiRbYWBQAY2YhLKHV1dbp48aJ6enq0fv16lZaWavXq1aqtrdWpU6dkWZa2bNkyFrUCAP5lxADfvHnzkOM7d+60uxYAQBI4ExMADEWAA4ChCHAAMBQBDgCGIsABwFAEOAAYigAHAEMR4ABgKAIcAAxFgAOAoQhwADAUAQ4AhiLAAcBQBDgAGIoABwBDEeAAYCgCHAAMRYADgKEIcAAwFAEOAIYiwAHAUAQ4ABjKnc6Ljx8/rlOnTsnlcmn27NmqqKiQx+OxqzbACKFIvxrPhxWJdsjrlsqLLfm8/DtA5qUc4F1dXTp58qRqa2vl8Xi0d+9enT17ViUlJTaWB4xvoUi/vvr5pkKRBwNjV8K92rViNiGOjEtrCSUWi6m/v18PHz5Uf3+/cnNz7aoLMELj+XBCeEtSKPJAjefDDlWEiSTlGXheXp5WrlypDRs2yOPxqLi4WMXFxU89LxgMKhgMSpKqq6tlWVbq1Y4Dbrfb+M9gp4nej0i0Y5hx14Tui8TvxpMy0Y+UAzwSiailpUX19fWaOnWq9u7dqzNnzujdd99NeF4gEFAgEBh4HA6bPTOxLMv4z2Cnid4P7zD/grzu+ITui8TvxpPS6Yff7x9yPOUllPb2ds2YMUPZ2dlyu91avHixrly5kurbAUZ69IXl5IQxn3eyyouZeSLzUp6BW5alq1evqq+vTx6PR+3t7Xr55ZftrA0Y93xej3atmP14F4pLXnecXSgYMykHeFFRkZYsWaJt27YpKytLc+fOTVgqASYKn9ejqnf8LBlgzKW1D7y0tFSlpaV21QIASAJnYgKAo
QhwADAUAQ4AhiLAAcBQBDgAGIoABwBDpbWNEBNXrDMkNTeq626PYtNekFaVa1KBz+mygAmFAEfSYp0hxWt3Sp0hDVyH78/LilXuJsSBMcQSCpLX3Ch1hhLHHs/IAYwdAhxJi9/uSmocQGYQ4Eiaa3peUuMAMoMAR/JWlUtPrnUX+B6NAxgzfImJpE0q8ClWuVtqbpT7bo+i7EIBHEGAIyWTCnzSuirlcQlVwDEsoQCAoQhwADAUAQ4AhiLAAcBQBDgAGIoABwBDEeAAYKi09oHfvXtX+/fv182bN+VyubRhwwbNmzfPrtoAAM+QVoAfPHhQr7/+uqqqqhSNRtXX12dXXQCAEaS8hHLv3j1dunRJy5cvlyS53W5NmzbNtsIAAM/misfj8VReeP36dR04cECzZs3SjRs3VFhYqLVr1+r5559PeF4wGFQwGJQkVVdXq7+/P/2qHeR2uxWNRp0uY9ygH4PoRSL6kSidfng8niHHUw7wP/74Q1988YX27NmjoqIiHTx4UFOmTNFHH330zNd1dHSkcrhxw+LaHwnoxyB6kYh+JEqnH36/f8jxlJdQ8vPzlZ+fr6KiIknSkiVLdO3atVTfDgCQpJQDfPr06crPzx+YUbe3t2vWrFm2FQYAeLa0dqF8+umn2rdvn6LRqGbMmKGKigq76gIAjCCtAJ87d66qq6vtqgUAkATOxAQAQxHgAGAoAhwADEWAA4ChCHAAMBQBDgCGIsABwFAEOAAYigAHAEMR4ABgKAIcAAxFgAOAoQhwADAUAQ4AhiLAAcBQBDgAGIoABwBDEeAAYCgCHAAMRYADgKEIcAAwVNoBHovF9Pnnn3N3egAYY2kH+IkTJzRz5kw7agEAJCGtAL9165ba2tq0YsUKu+oBAIxSWgF+6NAhrVmzRi6Xy656AACj5E71ha2trcrJyVFhYaEuXLgw7POCwaCCwaAkqbq6WpZlpXrIccHtdhv/GexEPwbRi0T0I1Em+uGKx+PxVF74448/6syZM8rKylJ/f796e3v11ltvadOmTc98XUdHR0qFjheWZSkcDjtdxrhBPwbRi0T0I1E6/fD7/UOOpzwDLysrU1lZmSTpwoULOnbs2IjhDQCwD/vAAcBQKc/A/+21117Ta6+9ZsdbAQBGiRk4ABiKAAcAQxHgAGAoAhwADEWAA4ChCHAAMBQBDgCGsmUfeCbFOkNSc6Pit7vkmp4nrSrXpAKf02UBgOPGdYDHOkOK1+6UOkOSpLgk/XlZscrdhDiACW98L6E0Nw6E94DHM3IAmOjGdYDHb3clNQ4AE8m4DnDX9LykxgFgIhnXAa5V5dKTa90FvkfjADDBjesvMScV+BSr3M0uFAAYwrgOcOlRiGtdldNlAMC4M76XUAAAwyLAAcBQBDgAGIoABwBDEeAAYCgCHAAMRYADgKFS3gceDodVX1+v27dvy+VyKRAI6IMPPrCzNgAwXijSr8bzYUWiHfK6pfJiSz6vx5b3TjnAs7Ky9Mknn6iwsFC9vb3avn27Fi5cqFmzZtlSGACYLhTp11c/31Qo8mBg7Eq4V7tWzLYlxFNeQsnNzVVhYaEkacqUKZo5c6a6urhKIAD8X+P5cEJ4S1Io8kCN58O2vL8tp9L//fffunbtml555ZWnfhYMBhUMBiVJ1dXVsizLjkM6xu12G/8Z7EQ/BtGLRPRDikQ7hhl32dKbtAP8/v37qqmp0dq1azV16tSnfh4IBBQIBAYeh8P2/M/jFMuyjP8MdqIfg+hFIvoheYdJWK87nlRv/H7/kONp7UKJRqOqqanR0qVLtXjx4nTeCgD+cx59YTk5YcznnazyYnv+Mkl5Bh6Px7V//37NnDlTH374oS3FAMB/ic/r0a4Vsx/vQnHJ646Pj10oly9f1pkzZzRnzhxt3bpVkvTxxx/rjTfesKUwAPgv8Hk9qnrHn5ElpZQD/NVXX9Xhw4ftrAUAkATOxAQAQxHgAGAoAhwADEWAA4ChXPF4PO50EQCA5
DEDT9L27dudLmFcoR+D6EUi+pEoE/0gwAHAUAQ4ABiKAE/Svy/MBfrxb/QiEf1IlIl+8CUmABiKGTgAGIoABwBD2XJHnomAmzg/LRaLafv27crLy5vwW8bu3r2r/fv36+bNm3K5XNqwYYPmzZvndFmOOH78uE6dOiWXy6XZs2eroqJCHo89l081QUNDg9ra2pSTk6OamhpJUiQSUW1trTo7O1VQUKDKykp5vd60j0WAjxI3cX7aiRMnNHPmTPX29jpdiuMOHjyo119/XVVVVYpGo+rr63O6JEd0dXXp5MmTqq2tlcfj0d69e3X27FmVlJQ4XdqYKSkp0fvvv6/6+vqBsaamJi1YsECrV69WU1OTmpqatGbNmrSPxRLKKHET50S3bt1SW1ubVqxY4XQpjrt3754uXbqk5cuXS3p0L8hp06Y5XJVzYrGY+vv79fDhQ/X39ys3N9fpksbU/Pnzn5pdt7S0aNmyZZKkZcuWqaWlxZZjMQNPwbNu4jxRHDp0SGvWrGH2rUe/D9nZ2WpoaNCNGzdUWFiotWvX6vnnn3e6tDGXl5enlStXasOGDfJ4PCouLlZxcbHTZTnun3/+GfiPLDc3V3fu3LHlfZmBJ2mkmzhPBK2trcrJyRn4i2Sie/jwoa5du6b33ntP33zzjZ577jk1NTU5XZYjIpGIWlpaVF9frwMHDuj+/fs6c+aM02X9ZxHgSeAmzo9cvnxZ586d08aNG1VXV6fffvtN+/btc7osx+Tn5ys/P19FRUWSpCVLlujatWsOV+WM9vZ2zZgxQ9nZ2XK73Vq8eLGuXLnidFmOy8nJUXd3tySpu7tb2dnZtrwvSyijxE2cB5WVlamsrEySdOHCBR07dkybNm1yuCrnTJ8+Xfn5+ero6JDf71d7e/uE/XLbsixdvXpVfX198ng8am9v18svv+x0WY578803dfr0aa1evVqnT5/WokWLbHlfzsQcpd9//107d+7UnDlz5HK5JHETZ2kwwCf6NsLr169r//79ikajmjFjhioqKmzZJmaiw4cP6+zZs8rKytLcuXO1fv16TZ482emyxkxdXZ0uXryonp4e5eTkqLS0VIsWLVJtba3C4bAsy9KWLVts+f0gwAHAUKyBA4ChCHAAMBQBDgCGIsABwFAEOAAYigAHAEMR4ABgqP8BiIEhR5MU4EwAAAAASUVORK5CYII=\n", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "from matplotlib import style\n", + "plt.scatter(x1,y1)\n", + "plt.scatter(x2,y2)\n", + "style.use('ggplot') #changes the appearance of the graph\n", + "plt.show()" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/Numpy Notebook.ipynb b/Numpy Notebook.ipynb new file mode 100644 index 0000000..99bf394 --- /dev/null +++ b/Numpy Notebook.ipynb @@ -0,0 +1,544 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "7021de6b", + "metadata": {}, + "source": [ + "# NumPy\n", + "NumPy is a Python Library which offers a range of mathematical functions.\n", + "NumPy has a syntax which is simultaneously compact, powerful and expressive. It allows users to manage data in vectors, matrices and higher dimensional arrays." 
+ ] + }, + { + "cell_type": "markdown", + "id": "8793bb24", + "metadata": {}, + "source": [ + "# Creating an Array using NumPy" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "adb1b0d8", + "metadata": {}, + "outputs": [], + "source": [ + "import numpy as np #imports numpy" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "91dd7ac5", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[1 2 3 4]\n", + "[[ 1 2 3 0]\n", + " [ 4 5 6 14]\n", + " [12 13 15 16]\n", + " [11 7 9 10]]\n" + ] + } + ], + "source": [ + "x = np.array([1,2,3,4]) #defining 1-D array\n", + "print(x)\n", + "y = np.array([[1,2,3,0],[4,5,6,14],[12,13,15,16],[11,7,9,10]]) #defining 2-D array\n", + "print(y)" + ] + }, + { + "cell_type": "markdown", + "id": "83438bad", + "metadata": {}, + "source": [ + "## Functions on Array" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "34856324", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "(4,)" + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "x.shape #shape function returns number of rows and colums of an array" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "6ed676e8", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "(4, 4)" + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "y.shape" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "id": "7ace46b9", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "dtype('int32')" + ] + }, + "execution_count": 6, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "y.dtype #dtype function returns data type of the array" + ] + }, + { + "cell_type": "markdown", + "id": "673ff55f", + "metadata": {}, + "source": [ + "#### Function to Acess Elements at Specific Index" + ] + }, + { + 
"cell_type": "code", + "execution_count": 7, + "id": "649c0632", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "5" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "y[1,1] #gives element at index (1,1) i.e. Row 1 Column 1 in array y" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "id": "8e1507b8", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "array([12, 13, 15, 16])" + ] + }, + "execution_count": 8, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "y[2,:] #This will return all elements of row 2 in the form of array" + ] + }, + { + "cell_type": "markdown", + "id": "07f7f184", + "metadata": {}, + "source": [ + "#### Intialising arrays using some in-built functions" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "ab2ffdfb", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[[0. 0. 0. 0.]]\n" + ] + } + ], + "source": [ + "zeros = np.zeros((1,4)) #This function will generate an array with 1 row and 4 columns with all 0 values.\n", + "print(zeros)" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "id": "b32c6c10", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[[1. 1. 1. 1. 1.]\n", + " [1. 1. 1. 1. 
1.]]\n" + ] + } + ], + "source": [ + "one = np.ones((2,5)) #This function will generate an array with 2 row and 5 columns with all 1 values.\n", + "print(one)" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "64437759", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[[0.85191043 0.92657634]\n", + " [0.80535181 0.92194349]]\n" + ] + } + ], + "source": [ + "random = np.random.rand(2,2) #This function will generate an array with 2 row and 2 columns all random elements.\n", + "print(random)" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "1d1842cc", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[[1. 0. 0.]\n", + " [0. 1. 0.]\n", + " [0. 0. 1.]]\n" + ] + } + ], + "source": [ + "id = np.identity(3) ##This function will generate an Identity Matrix with 3 row and 3 columns.\n", + "print(id)" + ] + }, + { + "cell_type": "markdown", + "id": "331733a0", + "metadata": {}, + "source": [ + "#### Scalar Operations on 2D Matrix" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "678f2f88", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[[ 3 4 5 2]\n", + " [ 6 7 8 16]\n", + " [14 15 17 18]\n", + " [13 9 11 12]]\n", + "[[-3 -2 -1 -4]\n", + " [ 0 1 2 10]\n", + " [ 8 9 11 12]\n", + " [ 7 3 5 6]]\n", + "[[ 3 6 9 0]\n", + " [12 15 18 42]\n", + " [36 39 45 48]\n", + " [33 21 27 30]]\n", + "[[0.5 1. 1.5 0. ]\n", + " [2. 2.5 3. 7. ]\n", + " [6. 6.5 7.5 8. ]\n", + " [5.5 3.5 4.5 5. 
]]\n", + "[[ 1 4 9 0]\n", + " [ 16 25 36 196]\n", + " [144 169 225 256]\n", + " [121 49 81 100]]\n" + ] + } + ], + "source": [ + "print(y+2) # perform arithematic operaions on all the values of the matrix\n", + "print(y-4)\n", + "print(y*3)\n", + "print(y/2)\n", + "print(y**2)" + ] + }, + { + "cell_type": "markdown", + "id": "273b57e3", + "metadata": {}, + "source": [ + "#### Matrix Operations" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "id": "7f26f20b", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[[ 4 8 12]\n", + " [ 5 10 7]\n", + " [ 7 9 2]]\n", + "[[26 20 22]\n", + " [32 52 68]\n", + " [14 30 36]]\n" + ] + } + ], + "source": [ + "s1 = np.array([[1,2,3],[4,6,2],[0,7,1]])\n", + "s2 = np.array([[3,6,9],[1,4,5],[7,2,1]])\n", + "\n", + "print(s1+s2) #performs matrix addition\n", + "p = np.matmul(s1,s2)\n", + "print(p) #performs matrix multiplication between s1 and s2" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "id": "96432d4e", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "1" + ] + }, + "execution_count": 15, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "np.min(s2) # returns min value in s2" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "id": "e4e2a3b6", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "9" + ] + }, + "execution_count": 16, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "np.max(s2) # returns max value in s2" + ] + }, + { + "cell_type": "markdown", + "id": "d45038dc", + "metadata": {}, + "source": [ + "#### Concept Of Axis in Arrays.\n", + "A 1D array has only 1 Axis (Axis 0) along its row. \n", + "A 2D array has 2 Axis (Axis 0, Axis 1) Axis 1 along its row and Axis 0 along its columns." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 17, + "id": "c279e1d9", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "array([11, 12, 15])" + ] + }, + "execution_count": 17, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "np.sum(s2,axis=0) #To add all elements of a column" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "id": "b4e7b247", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "array([18, 10, 10])" + ] + }, + "execution_count": 18, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "np.sum(s2,axis=1) #To add all elements of a row" + ] + }, + { + "cell_type": "markdown", + "id": "9ef08b34", + "metadata": {}, + "source": [ + "### Changing shape of an array" + ] + }, + { + "cell_type": "code", + "execution_count": 19, + "id": "fcacdaf8", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[[1]\n", + " [2]\n", + " [3]\n", + " [4]\n", + " [6]\n", + " [2]\n", + " [0]\n", + " [7]\n", + " [1]]\n", + "[[3 6 9]\n", + " [1 4 5]\n", + " [7 2 1]]\n" + ] + } + ], + "source": [ + "w1 = s1\n", + "print(w1.reshape(9,1)) #reshapes w1 into 9X1 Matrix\n", + "print(s2)" + ] + }, + { + "cell_type": "markdown", + "id": "5bcb8dd8", + "metadata": {}, + "source": [ + "#### Transpose of the Matrix." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 20, + "id": "c5e67278", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "array([[1, 4, 0],\n", + " [2, 6, 7],\n", + " [3, 2, 1]])" + ] + }, + "execution_count": 20, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "s1.T" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f81dd554", + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/Pandas Notebook.ipynb b/Pandas Notebook.ipynb new file mode 100644 index 0000000..c6f6fde --- /dev/null +++ b/Pandas Notebook.ipynb @@ -0,0 +1,826 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "f6826b4a", + "metadata": {}, + "source": [ + "# Pandas" + ] + }, + { + "cell_type": "markdown", + "id": "862d71bf", + "metadata": {}, + "source": [ + "Pandas is an open source library. It is a fast, powerful, flexible and easy to use open source data analysis and manipulation tool, built on top of the Python programming language. \n", + "It lets us work with spreadsheets along with the latest Python libraries and functions." 
+ ] + }, + { + "cell_type": "markdown", + "id": "d5210d68", + "metadata": {}, + "source": [ + "## Working with Pandas" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "id": "cdf73667", + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd #imports pandas" + ] + }, + { + "cell_type": "markdown", + "id": "554cc57c", + "metadata": {}, + "source": [ + "##### Pandas has two types of data structures:\n", + "#### Series:\n", + "It is a one-dimensional array with an index; it stores a single column or row of data from a datasheet. \n", + "#### DataFrame:\n", + "It's a tabular, spreadsheet-like structure made of rows, each of which contains one or multiple columns." + ] + }, + { + "cell_type": "markdown", + "id": "e6162491", + "metadata": {}, + "source": [ + "### Creating a Pandas series" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "id": "ec9b65fd", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0 13\n", + "1 24\n", + "2 36\n", + "dtype: int64" + ] + }, + "execution_count": 16, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "y = [13, 24, 36] #creating a python list\n", + "s = pd.Series(y) #converting python list into series\n", + "s" + ] + }, + { + "cell_type": "markdown", + "id": "9ba393cf", + "metadata": {}, + "source": [ + "### Creating Pandas DataFrame" + ] + }, + { + "cell_type": "code", + "execution_count": 34, + "id": "03ce33eb", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + " Name Age University Specialization\n", + "0 Neil 23 BHU Mathematics\n", + "1 Aishwarya 21 PU Biology\n", + "2 Rahul 22 DU Physics\n", + "3 Shivani 21 BHU Chemistry\n", + "4 Namrata 20 IIT Accountancy\n", + "5 Pawan 22 MU Mathematics\n", + "6 Karan 22 JNU Bio-Chemistry\n", + "7 Krish 23 MU Astrophysics\n" + ] + } + ], + "source": [ + "# Let us consider a dictionary\n", + "exa = {\n", + " 'Name' : ['Neil', 'Aishwarya', 'Rahul',
'Shivani','Namrata','Pawan', 'Karan','Krish'],\n", + " 'Age' : [23, 21, 22, 21, 20, 22, 22, 23],\n", + " 'University' : ['BHU', 'PU', 'DU', 'BHU', 'IIT', 'MU', 'JNU', 'MU'],\n", + " 'Specialization' : ['Mathematics' , 'Biology', 'Physics' , 'Chemistry', 'Accountancy', 'Mathematics', 'Bio-Chemistry', 'Astrophysics']}\n", + "df = pd.DataFrame(exa) # pd.DataFrame() converts dictionary into a data frame\n", + "print(df) #prints the data frame" + ] + }, + { + "cell_type": "markdown", + "id": "97331558", + "metadata": {}, + "source": [ + "### We can also convert this DataFrame into a .csv file, which can be opened in Excel, with the following command.\n" + ] + }, + { + "cell_type": "code", + "execution_count": 35, + "id": "7a08bc06", + "metadata": {}, + "outputs": [], + "source": [ + "df.to_csv(\"nameofthefile.csv\") #writes the DataFrame to a CSV file on the system." + ] + }, + { + "cell_type": "markdown", + "id": "0b24574a", + "metadata": {}, + "source": [ + "Sometimes we want to access only a few rows of the dataframe; in these cases we can use the **head()** or **tail()** function." + ] + }, + { + "cell_type": "code", + "execution_count": 36, + "id": "72528c26", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
NameAgeUniversitySpecialization
0Neil23BHUMathematics
1Aishwarya21PUBiology
2Rahul22DUPhysics
\n", + "
" + ], + "text/plain": [ + " Name Age University Specialization\n", + "0 Neil 23 BHU Mathematics\n", + "1 Aishwarya 21 PU Biology\n", + "2 Rahul 22 DU Physics" + ] + }, + "execution_count": 36, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.head(3) #prints only top 3 rows of the dataframe" + ] + }, + { + "cell_type": "code", + "execution_count": 37, + "id": "10d6b8c4", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
NameAgeUniversitySpecialization
6Karan22JNUBio-Chemistry
7Krish23MUAstrophysics
\n", + "
" + ], + "text/plain": [ + " Name Age University Specialization\n", + "6 Karan 22 JNU Bio-Chemistry\n", + "7 Krish 23 MU Astrophysics" + ] + }, + "execution_count": 37, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.tail(2) #prints only last 2 rows of the dataframe" + ] + }, + { + "cell_type": "markdown", + "id": "dca4f23f", + "metadata": {}, + "source": [ + "### We can also load CSV files (which Excel can open) into the Notebook with the following command. \n", + "Assume there is a file named salaries.csv on the system. It can be opened in the notebook with the following command. " + ] + }, + { + "cell_type": "markdown", + "id": "f859d5f3", + "metadata": {}, + "source": [ + "pd.read_csv('salaries.csv') \n", + "##### reads the CSV file named salaries.csv from the system into a DataFrame" + ] + }, + { + "cell_type": "markdown", + "id": "0b09d812", + "metadata": {}, + "source": [ + "##### We can access any column of the DataFrame with the following command:" + ] + }, + { + "cell_type": "code", + "execution_count": 39, + "id": "d0ba9156", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0 23\n", + "1 21\n", + "2 22\n", + "3 21\n", + "4 20\n", + "5 22\n", + "6 22\n", + "7 23\n", + "Name: Age, dtype: int64" + ] + }, + "execution_count": 39, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Age'] #selects only the 'Age' column of the dataframe (returned as a Series)." + ] + }, + { + "cell_type": "code", + "execution_count": 42, + "id": "bd41d921", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "22" + ] + }, + "execution_count": 42, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['Age'][2] #returns the element of the 'Age' column with index label 2."
+ ] + }, + { + "cell_type": "markdown", + "id": "ad8cd4e2", + "metadata": {}, + "source": [ + "###### We can also change the index of the dataframe like this:" + ] + }, + { + "cell_type": "code", + "execution_count": 45, + "id": "734cf8e3", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
NameAgeUniversitySpecialization
1Neil23BHUMathematics
2Aishwarya21PUBiology
3Rahul22DUPhysics
4Shivani21BHUChemistry
5Namrata20IITAccountancy
6Pawan22MUMathematics
7Karan22JNUBio-Chemistry
8Krish23MUAstrophysics
\n", + "
" + ], + "text/plain": [ + " Name Age University Specialization\n", + "1 Neil 23 BHU Mathematics\n", + "2 Aishwarya 21 PU Biology\n", + "3 Rahul 22 DU Physics\n", + "4 Shivani 21 BHU Chemistry\n", + "5 Namrata 20 IIT Accountancy\n", + "6 Pawan 22 MU Mathematics\n", + "7 Karan 22 JNU Bio-Chemistry\n", + "8 Krish 23 MU Astrophysics" + ] + }, + "execution_count": 45, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.index = [1,2,3,4,5,6,7,8] # specifying the desired index.\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 46, + "id": "fff76743", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "Int64Index: 8 entries, 1 to 8\n", + "Data columns (total 4 columns):\n", + " # Column Non-Null Count Dtype \n", + "--- ------ -------------- ----- \n", + " 0 Name 8 non-null object\n", + " 1 Age 8 non-null int64 \n", + " 2 University 8 non-null object\n", + " 3 Specialization 8 non-null object\n", + "dtypes: int64(1), object(3)\n", + "memory usage: 320.0+ bytes\n" + ] + } + ], + "source": [ + "df.info() #data summary " + ] + }, + { + "cell_type": "markdown", + "id": "f6ee85ad", + "metadata": {}, + "source": [ + "##### We can also calculate the statistical summary of the data using .describe() " + ] + }, + { + "cell_type": "code", + "execution_count": 47, + "id": "b4f80f3e", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Age
count8.000000
mean21.750000
std1.035098
min20.000000
25%21.000000
50%22.000000
75%22.250000
max23.000000
\n", + "
" + ], + "text/plain": [ + " Age\n", + "count 8.000000\n", + "mean 21.750000\n", + "std 1.035098\n", + "min 20.000000\n", + "25% 21.000000\n", + "50% 22.000000\n", + "75% 22.250000\n", + "max 23.000000" + ] + }, + "execution_count": 47, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.describe()" + ] + }, + { + "cell_type": "markdown", + "id": "80c8baea", + "metadata": {}, + "source": [ + "## Some Other Important Functions" + ] + }, + { + "cell_type": "markdown", + "id": "e33844cd", + "metadata": {}, + "source": [ + "##### .loc[]\n", + "\n", + "##### Access a group of rows and columns by their labels.\n", + "\n" + ] + }, + { + "cell_type": "code", + "execution_count": 52, + "id": "099bc2cc", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "1 BHU\n", + "2 PU\n", + "3 DU\n", + "4 BHU\n", + "5 IIT\n", + "6 MU\n", + "7 JNU\n", + "8 MU\n", + "Name: University, dtype: object" + ] + }, + "execution_count": 52, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.loc[:,'University'] # Prints column labelled 'University'" + ] + }, + { + "cell_type": "code", + "execution_count": 53, + "id": "15b13b8e", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Name Aishwarya\n", + "Age 21\n", + "University PU\n", + "Specialization Biology\n", + "Name: 2, dtype: object" + ] + }, + "execution_count": 53, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.loc[2,:] # Prints row labelled 2" + ] + }, + { + "cell_type": "code", + "execution_count": 54, + "id": "7bdf7088", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "'Namrata'" + ] + }, + "execution_count": 54, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.loc[5,'Name'] # Prints the element in the 'Name' column of the row labelled 5" + ] + }, + { + "cell_type": "markdown", + "id": "78fddb65", + "metadata": {}, + "source": [ + "##### .iloc[]\n", + "\n", + "##### Access a
group of rows and columns by their integer position.\n" + ] + }, + { + "cell_type": "code", + "execution_count": 55, + "id": "c4fdf666", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "1 Mathematics\n", + "2 Biology\n", + "3 Physics\n", + "4 Chemistry\n", + "5 Accountancy\n", + "6 Mathematics\n", + "7 Bio-Chemistry\n", + "8 Astrophysics\n", + "Name: Specialization, dtype: object" + ] + }, + "execution_count": 55, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.iloc[:,3] # Prints the column at integer position 3" + ] + }, + { + "cell_type": "code", + "execution_count": 56, + "id": "ebcd6699", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Name Shivani\n", + "Age 21\n", + "University BHU\n", + "Specialization Chemistry\n", + "Name: 4, dtype: object" + ] + }, + "execution_count": 56, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.iloc[3,:] # Prints the row at integer position 3 (here the row labelled 4)" + ] + }, + { + "cell_type": "code", + "execution_count": 57, + "id": "87775bc7", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "'Astrophysics'" + ] + }, + "execution_count": 57, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.iloc[7,3] # Prints the element at the intersection of the row at position 7 and the column at position 3." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "84cde1a0", + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +}