{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [],
"source": [
"#! pip install -r ../requirements.txt"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {},
"outputs": [],
"source": [
"import pandas as pd"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {},
"outputs": [],
"source": [
"links = pd.read_csv('../data/links.csv', index_col='movieId') # ids do filme y nas plataformas imdb e tmdb, util para enriquecer os dados\n",
"movies = pd.read_csv('../data/movies_m100_u10.csv', index_col='movieId') # dados do filme y\n",
"ratings = pd.read_csv('../data/ratings_m100_u10.csv', index_col='movieId') # avaliacao do usuario x pro filme y\n",
"tags = pd.read_csv('../data/tags.csv', index_col='movieId') # n parece mto relevante"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"
\n",
"\n",
"
\n",
" \n",
" \n",
" | \n",
" imdbId | \n",
" tmdbId | \n",
"
\n",
" \n",
" movieId | \n",
" | \n",
" | \n",
"
\n",
" \n",
" \n",
" \n",
" 1 | \n",
" 114709 | \n",
" 862.0 | \n",
"
\n",
" \n",
" 2 | \n",
" 113497 | \n",
" 8844.0 | \n",
"
\n",
" \n",
" 3 | \n",
" 113228 | \n",
" 15602.0 | \n",
"
\n",
" \n",
" 4 | \n",
" 114885 | \n",
" 31357.0 | \n",
"
\n",
" \n",
" 5 | \n",
" 113041 | \n",
" 11862.0 | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" imdbId tmdbId\n",
"movieId \n",
"1 114709 862.0\n",
"2 113497 8844.0\n",
"3 113228 15602.0\n",
"4 114885 31357.0\n",
"5 113041 11862.0"
]
},
"execution_count": 4,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"links.head()"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"\n",
"\n",
"
\n",
" \n",
" \n",
" | \n",
" title | \n",
" genres | \n",
"
\n",
" \n",
" movieId | \n",
" | \n",
" | \n",
"
\n",
" \n",
" \n",
" \n",
" 1 | \n",
" Toy Story (1995) | \n",
" Adventure|Animation|Children|Comedy|Fantasy | \n",
"
\n",
" \n",
" 2 | \n",
" Jumanji (1995) | \n",
" Adventure|Children|Fantasy | \n",
"
\n",
" \n",
" 6 | \n",
" Heat (1995) | \n",
" Action|Crime|Thriller | \n",
"
\n",
" \n",
" 10 | \n",
" GoldenEye (1995) | \n",
" Action|Adventure|Thriller | \n",
"
\n",
" \n",
" 32 | \n",
" Twelve Monkeys (a.k.a. 12 Monkeys) (1995) | \n",
" Mystery|Sci-Fi|Thriller | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" title \\\n",
"movieId \n",
"1 Toy Story (1995) \n",
"2 Jumanji (1995) \n",
"6 Heat (1995) \n",
"10 GoldenEye (1995) \n",
"32 Twelve Monkeys (a.k.a. 12 Monkeys) (1995) \n",
"\n",
" genres \n",
"movieId \n",
"1 Adventure|Animation|Children|Comedy|Fantasy \n",
"2 Adventure|Children|Fantasy \n",
"6 Action|Crime|Thriller \n",
"10 Action|Adventure|Thriller \n",
"32 Mystery|Sci-Fi|Thriller "
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"movies.head()"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"\n",
"\n",
"
\n",
" \n",
" \n",
" | \n",
" Unnamed: 0 | \n",
" userId | \n",
" rating | \n",
" timestamp | \n",
"
\n",
" \n",
" movieId | \n",
" | \n",
" | \n",
" | \n",
" | \n",
"
\n",
" \n",
" \n",
" \n",
" 1 | \n",
" 0 | \n",
" 1 | \n",
" 4.0 | \n",
" 964982703 | \n",
"
\n",
" \n",
" 6 | \n",
" 2 | \n",
" 1 | \n",
" 4.0 | \n",
" 964982224 | \n",
"
\n",
" \n",
" 47 | \n",
" 3 | \n",
" 1 | \n",
" 5.0 | \n",
" 964983815 | \n",
"
\n",
" \n",
" 50 | \n",
" 4 | \n",
" 1 | \n",
" 5.0 | \n",
" 964982931 | \n",
"
\n",
" \n",
" 110 | \n",
" 7 | \n",
" 1 | \n",
" 4.0 | \n",
" 964982176 | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" Unnamed: 0 userId rating timestamp\n",
"movieId \n",
"1 0 1 4.0 964982703\n",
"6 2 1 4.0 964982224\n",
"47 3 1 5.0 964983815\n",
"50 4 1 5.0 964982931\n",
"110 7 1 4.0 964982176"
]
},
"execution_count": 6,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"ratings.head()"
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"\n",
"\n",
"
\n",
" \n",
" \n",
" | \n",
" userId | \n",
" tag | \n",
" timestamp | \n",
"
\n",
" \n",
" movieId | \n",
" | \n",
" | \n",
" | \n",
"
\n",
" \n",
" \n",
" \n",
" 60756 | \n",
" 2 | \n",
" funny | \n",
" 1445714994 | \n",
"
\n",
" \n",
" 60756 | \n",
" 2 | \n",
" Highly quotable | \n",
" 1445714996 | \n",
"
\n",
" \n",
" 60756 | \n",
" 2 | \n",
" will ferrell | \n",
" 1445714992 | \n",
"
\n",
" \n",
" 89774 | \n",
" 2 | \n",
" Boxing story | \n",
" 1445715207 | \n",
"
\n",
" \n",
" 89774 | \n",
" 2 | \n",
" MMA | \n",
" 1445715200 | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" userId tag timestamp\n",
"movieId \n",
"60756 2 funny 1445714994\n",
"60756 2 Highly quotable 1445714996\n",
"60756 2 will ferrell 1445714992\n",
"89774 2 Boxing story 1445715207\n",
"89774 2 MMA 1445715200"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"tags.head()"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.11.4"
}
},
"nbformat": 4,
"nbformat_minor": 2
}