# --- Environment setup (IPython/Colab shell escapes) -------------------------
# Refresh the apt index, then install the native toolchain and the Python
# packages used by this notebook. `-y` pre-answers apt's confirmation prompt
# so the cell cannot stall waiting for keyboard input.
# NOTE(review): g++ and the JDK are presumably required by konlpy -- confirm.
! apt-get update
! apt-get install -y g++ openjdk-8-jdk
! pip3 install nltk konlpy matplotlib gensim

# Install the Nanum font family and fontconfig, then rebuild the system
# font cache so the newly installed fonts are discoverable.
! apt-get install -y fonts-nanum-eco
! apt-get install -y fontconfig
! fc-cache -fv

# Copy the Nanum fonts into matplotlib's bundled TTF directory and clear
# matplotlib's cache so its font list is rebuilt on next use.
# Both locations are resolved from the installed matplotlib at runtime (via
# IPython's `{expr}` expansion) instead of hard-coding a Python version or a
# home directory, which breaks as soon as the runtime image changes.
import matplotlib
! cp /usr/share/fonts/truetype/nanum/Nanum* {matplotlib.get_data_path()}/fonts/ttf/
! rm -rf {matplotlib.get_cachedir()}/*

# Download the WordNet corpus into NLTK's data directory.
import nltk
nltk.download('wordnet')
import pandas as pd
import io, requests
# --- Load the movie metadata --------------------------------------------------
# Download the CSV over HTTP and keep only the three text columns.
url = "https://raw.githubusercontent.com/YongBeomKim/nltk_basic/master/data/movies_metadata.csv"

# requests has no default timeout, so set one to avoid hanging forever on a
# stalled connection. Fail fast on an HTTP error status: otherwise the error
# page body would be handed to the CSV parser and surface as a confusing
# pandas error instead of the real cause.
http_reply = requests.get(url, timeout=60)
http_reply.raise_for_status()
response = http_reply.content  # raw bytes of the CSV file

movies = pd.read_csv(
    io.StringIO(response.decode('utf-8')),
    usecols=['original_title', 'overview', 'title'],
    low_memory=False,  # parse the file in one pass rather than in chunks
)

# Drop every row that has a missing value in any of the selected columns.
movies = movies.dropna(axis=0)
movies.shape

# Column views used downstream; despite the `_li` suffix these are pandas
# Series, not Python lists.
movie_plot_li = movies['overview']
movie_info_li = movies['title']
movies.head(3)