Python project

ash659956
STCdataset.ipynb

{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [ { "data": { "text/html": [ "<div>\n", "<style scoped>\n", " .dataframe tbody tr th:only-of-type {\n", " vertical-align: middle;\n", " }\n", "\n", " .dataframe tbody tr th {\n", " vertical-align: top;\n", " }\n", "\n", " .dataframe thead th {\n", " text-align: right;\n", " }\n", "</style>\n", "<table border=\"1\" class=\"dataframe\">\n", " <thead>\n", " <tr style=\"text-align: right;\">\n", " <th></th>\n", " <th>Unnamed: 0</th>\n", " <th>date_</th>\n", " <th>user_id_maped</th>\n", " <th>program_name</th>\n", " <th>duration_seconds</th>\n", " <th>program_class</th>\n", " <th>season</th>\n", " <th>episode</th>\n", " <th>program_desc</th>\n", " <th>program_genre</th>\n", " <th>series_title</th>\n", " <th>hd</th>\n", " <th>original_name</th>\n", " </tr>\n", " </thead>\n", " <tbody>\n",
 " <tr>\n", " <td>0</td>\n", " <td>1</td>\n", " <td>2017-05-27</td>\n", " <td>26138</td>\n", " <td>100 treets</td>\n", " <td>40</td>\n", " <td>MOVIE</td>\n", " <td>0</td>\n", " <td>0</td>\n", " <td>Drama Movie100 Streets</td>\n", " <td>Drama</td>\n", " <td>0</td>\n", " <td>0</td>\n", " <td>100 treets</td>\n", " </tr>\n",
 " <tr>\n", " <td>1</td>\n", " <td>3</td>\n", " <td>2017-05-21</td>\n", " <td>7946</td>\n", " <td>Moana</td>\n", " <td>17</td>\n", " <td>MOVIE</td>\n", " <td>0</td>\n", " <td>0</td>\n", " <td>Animation MovieMoana (HD)</td>\n", " <td>Animation</td>\n", " <td>0</td>\n", " <td>1</td>\n", " <td>Moana</td>\n", " </tr>\n",
 " <tr>\n", " <td>2</td>\n", " <td>4</td>\n", " <td>2017-08-10</td>\n", " <td>7418</td>\n", " <td>The Mermaid Princess</td>\n", " <td>8</td>\n", " <td>MOVIE</td>\n", " <td>0</td>\n", " <td>0</td>\n", " <td>Animation MovieThe Mermaid Princess (HD)</td>\n", " <td>Animation</td>\n", " <td>0</td>\n", " <td>1</td>\n", " <td>The Mermaid Princess</td>\n", " </tr>\n",
 " <tr>\n", " <td>3</td>\n", " <td>5</td>\n", " <td>2017-07-26</td>\n", " <td>19307</td>\n", " <td>The Mermaid Princess</td>\n", " <td>76</td>\n", " <td>MOVIE</td>\n", " <td>0</td>\n", " <td>0</td>\n", " <td>Animation MovieThe Mermaid Princess (HD)</td>\n", " <td>Animation</td>\n", " <td>0</td>\n", " <td>1</td>\n", " <td>The Mermaid Princess</td>\n", " </tr>\n",
 " <tr>\n", " <td>4</td>\n", " <td>7</td>\n", " <td>2017-07-07</td>\n", " <td>15860</td>\n", " <td>Churchill</td>\n", " <td>87</td>\n", " <td>MOVIE</td>\n", " <td>0</td>\n", " <td>0</td>\n", " <td>Biography MovieChurchill (HD)</td>\n", " <td>Biography</td>\n", " <td>0</td>\n", " <td>1</td>\n", " <td>Churchill</td>\n", " </tr>\n",
 " <tr>\n", " <td>5</td>\n", " <td>8</td>\n", " <td>2017-08-19</td>\n", " <td>20775</td>\n", " <td>Beavis And Butt-Head Do America</td>\n", " <td>3</td>\n", " <td>MOVIE</td>\n", " <td>0</td>\n", " <td>0</td>\n", " <td>Animation MovieBeavis And Butt-Head Do America</td>\n", " <td>Animation</td>\n", " <td>0</td>\n", " <td>0</td>\n", " <td>Beavis And Butt-Head Do America</td>\n", " </tr>\n",
 " <tr>\n", " <td>6</td>\n", " <td>9</td>\n", " <td>2017-06-26</td>\n", " <td>11374</td>\n", " <td>The Mermaid Princess</td>\n", " <td>33577</td>\n", " <td>MOVIE</td>\n", " <td>0</td>\n", " <td>0</td>\n", " <td>Animation MovieThe Mermaid Princess (HD)</td>\n", " <td>Animation</td>\n", " <td>0</td>\n", " <td>1</td>\n", " <td>The Mermaid Princess</td>\n", " </tr>\n",
 " <tr>\n", " <td>7</td>\n", " <td>10</td>\n", " <td>2018-03-29</td>\n", " <td>6358</td>\n", " <td>Coco</td>\n", " <td>14</td>\n", " <td>MOVIE</td>\n", " <td>0</td>\n", " <td>0</td>\n", " <td>Animation MovieCoco (HD)</td>\n", " <td>Animation</td>\n", " <td>0</td>\n", " <td>1</td>\n", " <td>Coco</td>\n", " </tr>\n",
 " <tr>\n", " <td>8</td>\n", " <td>11</td>\n", " <td>2018-01-27</td>\n", " <td>11660</td>\n", " <td>Kidnap</td>\n", " <td>85</td>\n", " <td>MOVIE</td>\n", " <td>0</td>\n", " <td>0</td>\n", " <td>Action MovieKidnap (HD)</td>\n", " <td>Action</td>\n", " <td>0</td>\n", " <td>1</td>\n", " <td>Kidnap</td>\n", " </tr>\n",
 " <tr>\n", " <td>9</td>\n", " <td>12</td>\n", " <td>2017-03-30</td>\n", " <td>5155</td>\n", " <td>The Accountant</td>\n", " <td>42</td>\n", " <td>MOVIE</td>\n", " <td>0</td>\n", " <td>0</td>\n", " <td>Action MovieThe Accountant (HD)</td>\n", " <td>Action</td>\n", " <td>0</td>\n", " <td>1</td>\n", " <td>The Accountant</td>\n", " </tr>\n",
 " </tbody>\n", "</table>\n", "</div>" ],
 "text/plain": [ " Unnamed: 0 date_ user_id_maped program_name \\\n", "0 1 2017-05-27 26138 100 treets \n", "1 3 2017-05-21 7946 Moana \n", "2 4 2017-08-10 7418 The Mermaid Princess \n", "3 5 2017-07-26 19307 The Mermaid Princess \n", "4 7 2017-07-07 15860 Churchill \n", "5 8 2017-08-19 20775 Beavis And Butt-Head Do America \n", "6 9 2017-06-26 11374 The Mermaid Princess \n", "7 10 2018-03-29 6358 Coco \n", "8 11 2018-01-27 11660 Kidnap \n", "9 12 2017-03-30 5155 The Accountant \n", "\n", " duration_seconds program_class season episode \\\n", "0 40 MOVIE 0 0 \n", "1 17 MOVIE 0 0 \n", "2 8 MOVIE 0 0 \n", "3 76 MOVIE 0 0 \n", "4 87 MOVIE 0 0 \n", "5 3 MOVIE 0 0 \n", "6 33577 MOVIE 0 0 \n", "7 14 MOVIE 0 0 \n", "8 85 MOVIE 0 0 \n", "9 42 MOVIE 0 0 \n", "\n", " program_desc program_genre series_title \\\n", "0 Drama Movie100 Streets Drama 0 \n", "1 Animation MovieMoana (HD) Animation 0 \n", "2 Animation MovieThe Mermaid Princess (HD) Animation 0 \n", "3 Animation MovieThe Mermaid Princess (HD) Animation 0 \n", "4 Biography MovieChurchill (HD) Biography 0 \n", "5 Animation MovieBeavis And Butt-Head Do America Animation 0 \n", "6 Animation MovieThe Mermaid Princess (HD) Animation 0 \n", "7 Animation MovieCoco (HD) Animation 0 \n", "8 Action MovieKidnap (HD) Action 0 \n", "9 Action MovieThe Accountant (HD) Action 0 \n", "\n", " hd original_name \n", "0 0 100 treets \n", "1 1 Moana \n", "2 1 The Mermaid Princess \n", "3 1 The Mermaid Princess \n", "4 1 Churchill \n", "5 0 Beavis And Butt-Head Do America \n", "6 1 The Mermaid Princess \n", "7 1 Coco \n", "8 1 Kidnap \n", "9 1 The Accountant " ] },
 "execution_count": 1, "metadata": {}, "output_type": "execute_result" } ], "source": [ "import pandas as pd\n", "\n", "df = pd.read_csv(\"Final_Dataset.txt\")\n", "df.head(10)" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "(3598607, 13)" ] }, "execution_count": 3, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df.shape" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.7.4" } }, "nbformat": 4, "nbformat_minor": 2 }