#!/usr/bin/env python
# coding: utf-8

# PyCaret classification walkthrough, exported from a Jupyter notebook.
# The "# In[n]:" markers are the original notebook cell numbers. The steps
# run top to bottom at import time and depend on each other: later cells
# reuse the models created by earlier ones.

# # Installation

# Run this to install pycaret in Google Colab:
# !pip install pycaret

# In a Jupyter notebook, pycaret can be installed from the notebook itself
# or from the command line:
# pip install pycaret

# In[1]:

from pycaret.utils import version

version()


# # 1. Importing Dataset

# In[2]:

from pycaret.datasets import get_data

data = get_data('juice')


# # 2. Setting up Environment

# In[3]:

# The star import supplies every pycaret function called below
# (setup, create_model, plot_model, ...).
from pycaret.classification import *

# session_id is pinned to a fixed value.
# NOTE(review): presumably this acts as the random seed - confirm in the
# setup() documentation.
clf1 = setup(data, target='Purchase', session_id=786)


# # 3. Compare Models

# In[4]:

compare_models()


# # 4. Create Model

# In[5]:

lr = create_model('lr')

# In[6]:

dt = create_model('dt')


# # 5. Tune Model

# In[7]:

# NOTE(review): tune_model is given the estimator ID string here, not the
# `dt` object created above - confirm that the installed pycaret release
# accepts this form.
tuned_dt = tune_model('dt')

# In[8]:

tuned_nb = tune_model('nb', optimize='AUC', n_iter=20)


# # 6. Ensemble Model

# In[9]:

# No method is passed, so ensemble_model uses its default.
bagged_dt = ensemble_model(dt)

# In[10]:

boosted_dt = ensemble_model(dt, method='Boosting')


# # 7. Blend Models

# In[11]:

# Build the three base models with verbose=False, in the same order as the
# original cell. `lr` is rebound here, replacing the model from In[5].
lr, lda, gbc = (
    create_model(model_id, verbose=False)
    for model_id in ('lr', 'lda', 'gbc')
)

# In[12]:

blender = blend_models(estimator_list=[lr, lda, gbc], method='soft')

# In[13]:

# Bare expression: a notebook echoes it as cell output; as a plain script it
# only evaluates the attribute.
blender.estimators_


# # 8. Analyze Model

# In[14]:

# plot_model's default plot for the blender.
plot_model(blender)

# In[15] - In[17]:

for plot_kind in ('confusion_matrix', 'threshold', 'pr'):
    plot_model(blender, plot=plot_kind)

# In[18]:

plot_model(tuned_dt, plot='vc')

# In[19] - In[21]:

# Same 'boundary' plot for three different models, in the original order.
for fitted_model in (dt, tuned_nb, blender):
    plot_model(fitted_model, plot='boundary')

# In[22]:

evaluate_model(tuned_nb)


# # 9. Interpret Model

# In[23]:

# NOTE(review): this top-level name matches the `xgboost` package name;
# it is kept because it is the name the rest of the script uses.
xgboost = create_model('xgboost')

# In[24]:

interpret_model(xgboost)

# In[25]:

interpret_model(xgboost, plot='correlation')

# In[26]:

# 'reason' plot for a single observation (index 1) ...
interpret_model(xgboost, plot='reason', observation=1)

# In[27]:

# ... and again without selecting an observation.
interpret_model(xgboost, plot='reason')


# # Learning Resources:
#
# - PyCaret Classification Module : https://www.pycaret.org/classification
# - Binary Classification Tutorial (Level Beginner) : https://pycaret.org/clf101/
# - Binary Classification Tutorial (Level Intermediate) : https://pycaret.org/clf102/
# - Kaggle Titanic Predictions (Video Tutorial) : https://www.youtube.com/watch?v=nqMM6rngNCA