#!/usr/bin/env python
# coding: utf-8
"""Quick exploratory pass over a CSV dataset.

Reads the CSV located at ``config['data_url']``, prints its shape, first rows
and summary statistics, then draws one histogram per numeric column followed
by a scatter matrix of the numeric columns.

``config`` may already be defined before this code runs (e.g. passed in by
papermill); when it is not, a default pointing at a Titanic CSV is used.
"""

# In[6]:

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

# ``get_ipython`` is only defined inside an IPython/Jupyter session.  Guard the
# magic so the exported script also runs under a plain Python interpreter,
# where matplotlib's default backend is used instead.
try:
    get_ipython().run_line_magic('matplotlib', 'inline')
except NameError:
    pass

plt.style.use('ggplot')

# check if config exists
try:
    config
except NameError:
    config_exists = False
else:
    config_exists = True

# make config if it does not exist already (e.g. passed in by papermill)
if not config_exists:
    # set up some config for the experiment run
    config = {
        "data_url": "https://raw.githubusercontent.com/andrewm4894/papermill_dev/master/data/titanic.csv",
    }

# Show the effective configuration, whether injected or defaulted.
print(config)

# In[7]:

df = pd.read_csv(config['data_url'])
print(df.shape)
# Printed explicitly: a bare expression is only rendered by a notebook cell
# and would be silently discarded when this file runs as a script.
print(df.head())

# In[8]:

print(df.describe())

# In[9]:

# Public replacement for the private ``DataFrame._get_numeric_data()``.
# "bool" is included because the private helper is understood to treat boolean
# columns as numeric as well -- NOTE(review): confirm against the pandas
# version in use.  Computed once and reused by both plotting sections.
numeric_df = df.select_dtypes(include=["number", "bool"])

# One histogram per numeric column, each shown as its own figure.
for col in numeric_df.columns:
    ax = df[col].hist()
    ax.set_title(col)
    plt.show()

# In[10]:

# Pairwise scatter plots of the numeric columns.
pd.plotting.scatter_matrix(numeric_df, figsize=(10, 10))
plt.show()