#!/usr/bin/env python # coding: utf-8 # In[1]: # IMPORT import pandas as pd # ### Pandas Data Structure - Series # In[2]: sr = pd.Series([1,2,3,-3,4,0]) print(sr) # In[3]: # get values frm Series print(sr.values) # In[4]: # get indexes from Series print(sr.index) # In[5]: # some calc on Seires print("2nd indexed value:",sr[2], "\nadding 2nd + 4rd index:", sr[2]+sr[4]) # In[6]: # creating Series with named index sr1 = pd.Series([1,2,0,-3,4,-6], index=['a','b','c','d','e','f']) print(sr1) # In[7]: for e in sr1.index: print(e, "\t", sr1[e]) # In[8]: # getting only positive values from Series print(sr1[sr1>=0]) # In[9]: # we can convert a dictionary into Series sdata = {'Ohio': 35000, 'Texas': 71000, 'Oregon': 16000, 'Utah': 5000} print(sdata, type(sdata)) # In[10]: sr2 = pd.Series(sdata) print(sr2) # In[11]: ind = ['California', 'Alabama', 'Oregon', 'Texas'] sr3 = pd.Series(sdata, index=ind) print(sr3) # In[12]: # Californica and Alabama's value is NaN (Not a Number) cause there is no value for these index in sdata # let's check for NULLability print(pd.isnull(sr3)) # In[13]: print(pd.notnull(sr3)) # In[14]: print(sr2+sr3) # In[15]: # Series object can have Name and index Name sr3.name = "States" sr3.index.name = "Population" print(sr3) # In[16]: # Stats about Series print(sr3.name,"\t",sr3.shape,"\t",len(sr3)) #print name, shape and length # In[17]: print(sr3.index,"\t",sr3.index.name) #print indexes and index name # In[18]: print(sr3.dtype) #print data type # In[19]: print(sr3.values) #print Series values #