{ "cells": [ { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "import opendatasets as od" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Downloading mpst-movie-plot-synopses-with-tags.zip to .\\mpst-movie-plot-synopses-with-tags\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "100%|██████████| 28.8M/28.8M [00:07<00:00, 3.81MB/s]\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "\n" ] } ], "source": [ "# Fetch the MPST dataset from Kaggle into ./mpst-movie-plot-synopses-with-tags\n", "od.download('https://www.kaggle.com/datasets/cryptexcode/mpst-movie-plot-synopses-with-tags')" ] }, { "cell_type": "code", "execution_count": 6, "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "\n", "# Use '/' as the path separator: it resolves on every OS, whereas a backslash\n", "# is Windows-only and forms an invalid escape sequence inside a string literal.\n", "df = pd.read_csv('mpst-movie-plot-synopses-with-tags/mpst_full_data.csv')" ] }, { "cell_type": "code", "execution_count": 7, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | imdb_id | \n", "title | \n", "plot_synopsis | \n", "tags | \n", "split | \n", "synopsis_source | \n", "
---|---|---|---|---|---|---|
0 | \n", "tt0057603 | \n", "I tre volti della paura | \n", "Note: this synopsis is for the orginal Italian... | \n", "cult, horror, gothic, murder, atmospheric | \n", "train | \n", "imdb | \n", "
1 | \n", "tt1733125 | \n", "Dungeons & Dragons: The Book of Vile Darkness | \n", "Two thousand years ago, Nhagruul the Foul, a s... | \n", "violence | \n", "train | \n", "imdb | \n", "
2 | \n", "tt0033045 | \n", "The Shop Around the Corner | \n", "Matuschek's, a gift store in Budapest, is the ... | \n", "romantic | \n", "test | \n", "imdb | \n", "
3 | \n", "tt0113862 | \n", "Mr. Holland's Opus | \n", "Glenn Holland, not a morning person by anyone'... | \n", "inspiring, romantic, stupid, feel-good | \n", "train | \n", "imdb | \n", "
4 | \n", "tt0086250 | \n", "Scarface | \n", "In May 1980, a Cuban man named Tony Montana (A... | \n", "cruelty, murder, dramatic, cult, violence, atm... | \n", "val | \n", "imdb | \n", "