HOME/Articles/

matplotlib example eda imports (snippet)

Article Outline

Python matplotlib example 'eda imports'

Modules used in program:

  • import matplotlib.pyplot as plt
  • import matplotlib as mpl
  • import matplotlib.style # https://matplotlib.org/users/dflt_style_changes.html
  • import scipy.stats as stats
  • import pandas as pd
  • import numpy as np
  • import pytz
  • import calendar
  • import multiprocessing
  • import pickle
  • import functools
  • import itertools
  • import tempfile
  • import datetime
  • import csv
  • import re
  • import json
  • import glob
  • import sys
  • import time
  • import gzip
  • import io
  • import os

python eda imports

Python matplotlib example: eda imports

import os
import io
import gzip
import time
import sys
import glob
import json
import re
import csv
import datetime
import tempfile
import itertools
import functools
import pickle
import multiprocessing
import calendar
from collections import Counter

import pytz
import numpy as np
import pandas as pd
from pandas.plotting import scatter_matrix
import scipy.stats as stats
from scipy import interp
from scipy.cluster.hierarchy import dendrogram, linkage, fcluster, fclusterdata
from tqdm import tqdm

import matplotlib.style    # https://matplotlib.org/users/dflt_style_changes.html
import matplotlib as mpl
# mpl.use('Agg')    # has to be before pyplot import
import matplotlib.pyplot as plt
from mpl_toolkits.mplot3d import Axes3D
from IPython.display import display, Image, HTML
try:
  import seaborn as sns
except ImportError:
  print('seaborn not found')

try:
  from sqlalchemy import create_engine
except ImportError:
  print('sqlalchemy not found')

# related to preprocessing 
from sklearn.preprocessing import LabelEncoder, OneHotEncoder, StandardScaler, Normalizer, label_binarize
from sklearn.feature_selection import SelectKBest, chi2
from sklearn.model_selection import GridSearchCV

# related to unsupervised learning 
from sklearn.decomposition import TruncatedSVD, PCA
from sklearn.manifold import TSNE
from sklearn.neighbors import KNeighborsClassifier
from sklearn.cluster import KMeans

# related to learning
from sklearn.linear_model import LogisticRegression, LogisticRegressionCV, LinearRegression
from sklearn import svm
from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor, export_graphviz
from sklearn.ensemble import  GradientBoostingRegressor, GradientBoostingClassifier, AdaBoostClassifier, RandomForestClassifier
from sklearn.multiclass import OneVsRestClassifier, OneVsOneClassifier

# related to evaluation
from sklearn.model_selection import StratifiedKFold, train_test_split, cross_val_score
from sklearn import metrics
kappa_scorer = metrics.make_scorer(metrics.cohen_kappa_score)

pd.set_option('display.max_columns', 250)
pd.set_option('display.max_rows', 250)
# Don't cut off long string
# http://stackoverflow.com/questions/26277757/pandas-to-html-truncates-string-contents
pd.set_option('display.max_colwidth', -1)

mpl.style.use('classic')
mpl.rcParams['figure.figsize'] = (8, 4.5)
get_ipython().magic('matplotlib inline')
get_ipython().run_line_magic('config', "InlineBackend.figure_format = 'retina'")

# for auto-reloading external modules
# see http://stackoverflow.com/questions/1907993/autoreload-of-modules-in-ipython
get_ipython().magic('load_ext autoreload')
get_ipython().magic('autoreload 2')

display(HTML(data="""
<style>
   div#notebook-container    { width: 100%; }
   div#menubar-container     { width: 100%; }
   div#maintoolbar-container { width: 100%; }
</style>
"""))