Agenda = '''
1. Built in Exception
2. User Define Exception
3. Data Science Introduction
4. Numpy
    a) Array 
    b) Matrix
5. pandas 
    a) Series
    b) Dataframe
6. Matplotlib
    a) Visualisation of Data
7. Data Science Case Study 
8. Summary and Conclusion
'''

Exception in Python¶

data = int(input("Enter Some data:"))

Enter Some data:hi

---------------------------------------------------------------------------
ValueError                                Traceback (most recent call last)
<ipython-input-2-42575b99cd48> in <module>
----> 1 data = int(input("Enter Some data:"))

ValueError: invalid literal for int() with base 10: 'hi'

data = int(input("Enter Some data:"))

Enter Some data:34

hi

---------------------------------------------------------------------------
NameError                                 Traceback (most recent call last)
<ipython-input-4-55ca6286e3e4> in <module>
----> 1 hi

NameError: name 'hi' is not defined

dir(Exception)

['__cause__',
 '__class__',
 '__context__',
 '__delattr__',
 '__dict__',
 '__dir__',
 '__doc__',
 '__eq__',
 '__format__',
 '__ge__',
 '__getattribute__',
 '__gt__',
 '__hash__',
 '__init__',
 '__init_subclass__',
 '__le__',
 '__lt__',
 '__ne__',
 '__new__',
 '__reduce__',
 '__reduce_ex__',
 '__repr__',
 '__setattr__',
 '__setstate__',
 '__sizeof__',
 '__str__',
 '__subclasshook__',
 '__suppress_context__',
 '__traceback__',
 'args',
 'with_traceback']

help(Exception)

Help on class Exception in module builtins:

class Exception(BaseException)
 |  Common base class for all non-exit exceptions.
 |  
 |  Method resolution order:
 |      Exception
 |      BaseException
 |      object
 |  
 |  Methods defined here:
 |  
 |  __init__(self, /, *args, **kwargs)
 |      Initialize self.  See help(type(self)) for accurate signature.
 |  
 |  ----------------------------------------------------------------------
 |  Static methods defined here:
 |  
 |  __new__(*args, **kwargs) from builtins.type
 |      Create and return a new object.  See help(type) for accurate signature.
 |  
 |  ----------------------------------------------------------------------
 |  Methods inherited from BaseException:
 |  
 |  __delattr__(self, name, /)
 |      Implement delattr(self, name).
 |  
 |  __getattribute__(self, name, /)
 |      Return getattr(self, name).
 |  
 |  __reduce__(...)
 |      Helper for pickle.
 |  
 |  __repr__(self, /)
 |      Return repr(self).
 |  
 |  __setattr__(self, name, value, /)
 |      Implement setattr(self, name, value).
 |  
 |  __setstate__(...)
 |  
 |  __str__(self, /)
 |      Return str(self).
 |  
 |  with_traceback(...)
 |      Exception.with_traceback(tb) --
 |      set self.__traceback__ to tb and return self.
 |  
 |  ----------------------------------------------------------------------
 |  Data descriptors inherited from BaseException:
 |  
 |  __cause__
 |      exception cause
 |  
 |  __context__
 |      exception context
 |  
 |  __dict__
 |  
 |  __suppress_context__
 |  
 |  __traceback__
 |  
 |  args

help(BaseException)

Help on class BaseException in module builtins:

class BaseException(object)
 |  Common base class for all exceptions
 |  
 |  Methods defined here:
 |  
 |  __delattr__(self, name, /)
 |      Implement delattr(self, name).
 |  
 |  __getattribute__(self, name, /)
 |      Return getattr(self, name).
 |  
 |  __init__(self, /, *args, **kwargs)
 |      Initialize self.  See help(type(self)) for accurate signature.
 |  
 |  __reduce__(...)
 |      Helper for pickle.
 |  
 |  __repr__(self, /)
 |      Return repr(self).
 |  
 |  __setattr__(self, name, value, /)
 |      Implement setattr(self, name, value).
 |  
 |  __setstate__(...)
 |  
 |  __str__(self, /)
 |      Return str(self).
 |  
 |  with_traceback(...)
 |      Exception.with_traceback(tb) --
 |      set self.__traceback__ to tb and return self.
 |  
 |  ----------------------------------------------------------------------
 |  Static methods defined here:
 |  
 |  __new__(*args, **kwargs) from builtins.type
 |      Create and return a new object.  See help(type) for accurate signature.
 |  
 |  ----------------------------------------------------------------------
 |  Data descriptors defined here:
 |  
 |  __cause__
 |      exception cause
 |  
 |  __context__
 |      exception context
 |  
 |  __dict__
 |  
 |  __suppress_context__
 |  
 |  __traceback__
 |  
 |  args

Handle Exception¶

try:
    data = int(input("Enter Some data:"))
except ValueError as e:
    print("Enter Integer Value only::",e )
else:
    print("Your data is", data)

Enter Some data:hi
Enter Integer Value only:: invalid literal for int() with base 10: 'hi'

# Keep prompting until the text typed by the user parses as an integer.
while True:
    try:
        data = int(input("Enter Some data:"))
    except ValueError as err:
        # int() rejected the text: report the reason and prompt again.
        print("Enter Integer Value only::", err)
        continue
    print("Your data is", data)
    break

Enter Some data:hi
Enter Integer Value only:: invalid literal for int() with base 10: 'hi'
Enter Some data:343
Your data is 343

User-Defined Exception¶

%%writefile ShortInputModule.py

'''User Define Exception Module. 
ShortInput Exception. It should raise ShortInput Exception 
for the data of length less than six bytes ( chars ).
'''

class ShortInput(Exception):
    '''Raised when supplied data is shorter than the required minimum size.

    Attributes:
        inputdata: value passed as the size of the data that was received.
        atleast: value passed as the minimum size that was expected.

    Creating an instance prints a one-line notice naming both sizes; the
    two constructor arguments also remain available through ``args``.
    '''

    def __init__(self, inputdata, atleast):
        '''Remember both sizes on the instance and print the notice.'''
        notice = ("Your input data size is %d bytes which is shorter than "
                  "expected data %d bytes")
        self.inputdata, self.atleast = inputdata, atleast
        print(notice % (inputdata, atleast))


if __name__ == '__main__':
    Ob1 = ShortInput(5, 6)

Overwriting ShortInputModule.py

from ShortInputModule import ShortInput

help(ShortInput)

Help on class ShortInput in module ShortInputModule:

class ShortInput(builtins.Exception)
 |  ShortInput(inputdata, atleast)
 |  
 |  ShortInput Exception. It should raise ShortInput Exception 
 |  for the data of length less than six bytes ( chars ).
 |  
 |  Method resolution order:
 |      ShortInput
 |      builtins.Exception
 |      builtins.BaseException
 |      builtins.object
 |  
 |  Methods defined here:
 |  
 |  __init__(self, inputdata, atleast)
 |      Initialise ShortInput Class with data and minimum size
 |  
 |  ----------------------------------------------------------------------
 |  Data descriptors defined here:
 |  
 |  __weakref__
 |      list of weak references to the object (if defined)
 |  
 |  ----------------------------------------------------------------------
 |  Static methods inherited from builtins.Exception:
 |  
 |  __new__(*args, **kwargs) from builtins.type
 |      Create and return a new object.  See help(type) for accurate signature.
 |  
 |  ----------------------------------------------------------------------
 |  Methods inherited from builtins.BaseException:
 |  
 |  __delattr__(self, name, /)
 |      Implement delattr(self, name).
 |  
 |  __getattribute__(self, name, /)
 |      Return getattr(self, name).
 |  
 |  __reduce__(...)
 |      Helper for pickle.
 |  
 |  __repr__(self, /)
 |      Return repr(self).
 |  
 |  __setattr__(self, name, value, /)
 |      Implement setattr(self, name, value).
 |  
 |  __setstate__(...)
 |  
 |  __str__(self, /)
 |      Return str(self).
 |  
 |  with_traceback(...)
 |      Exception.with_traceback(tb) --
 |      set self.__traceback__ to tb and return self.
 |  
 |  ----------------------------------------------------------------------
 |  Data descriptors inherited from builtins.BaseException:
 |  
 |  __cause__
 |      exception cause
 |  
 |  __context__
 |      exception context
 |  
 |  __dict__
 |  
 |  __suppress_context__
 |  
 |  __traceback__
 |  
 |  args

import ShortInputModule

help(ShortInputModule)

Help on module ShortInputModule:

NAME
    ShortInputModule

DESCRIPTION
    User Define Exception Module. 
    ShortInput Exception. It should raise ShortInput Exception 
    for the data of length less than six bytes ( chars ).

CLASSES
    builtins.Exception(builtins.BaseException)
        ShortInput
    
    class ShortInput(builtins.Exception)
     |  ShortInput(inputdata, atleast)
     |  
     |  ShortInput Exception. It should raise ShortInput Exception 
     |  for the data of length less than six bytes ( chars ).
     |  
     |  Method resolution order:
     |      ShortInput
     |      builtins.Exception
     |      builtins.BaseException
     |      builtins.object
     |  
     |  Methods defined here:
     |  
     |  __init__(self, inputdata, atleast)
     |      Initialise ShortInput Class with data and minimum size
     |  
     |  ----------------------------------------------------------------------
     |  Data descriptors defined here:
     |  
     |  __weakref__
     |      list of weak references to the object (if defined)
     |  
     |  ----------------------------------------------------------------------
     |  Static methods inherited from builtins.Exception:
     |  
     |  __new__(*args, **kwargs) from builtins.type
     |      Create and return a new object.  See help(type) for accurate signature.
     |  
     |  ----------------------------------------------------------------------
     |  Methods inherited from builtins.BaseException:
     |  
     |  __delattr__(self, name, /)
     |      Implement delattr(self, name).
     |  
     |  __getattribute__(self, name, /)
     |      Return getattr(self, name).
     |  
     |  __reduce__(...)
     |      Helper for pickle.
     |  
     |  __repr__(self, /)
     |      Return repr(self).
     |  
     |  __setattr__(self, name, value, /)
     |      Implement setattr(self, name, value).
     |  
     |  __setstate__(...)
     |  
     |  __str__(self, /)
     |      Return str(self).
     |  
     |  with_traceback(...)
     |      Exception.with_traceback(tb) --
     |      set self.__traceback__ to tb and return self.
     |  
     |  ----------------------------------------------------------------------
     |  Data descriptors inherited from builtins.BaseException:
     |  
     |  __cause__
     |      exception cause
     |  
     |  __context__
     |      exception context
     |  
     |  __dict__
     |  
     |  __suppress_context__
     |  
     |  __traceback__
     |  
     |  args

DATA
    Ob1 = ShortInput(5, 6)

FILE
    /Users/surendra/ShortInputModule.py

from ShortInputModule import ShortInput


# Keep prompting until the entered text is at least six characters long.
while True:
    data = input("Enter Some data:")
    try:
        # Signal too-short input through the user-defined exception.
        if len(data) < 6:
            raise ShortInput(len(data), 6)
    except ShortInput as err:
        print("Shortinput Exception Occurred", err)
        continue
    print("Your data is", data)
    break

Enter Some data:3434
Your input data size is 4 bytes which is shorter than expected data 6 bytes
Shortinput Exception Occurred (4, 6)
Enter Some data:242329389
Your data is 242329389

Numpy¶

NumPy is a library for multidimensional arrays and matrices (two-dimensional arrays).

List Addition¶

import numpy as np

# Two plain Python lists; `+` on lists concatenates them end to end
# rather than adding element by element.
List1 = [*range(1, 10)]
List2 = [*range(11, 20)]
List3 = List1 + List2

# One list per output line, in the order they were built.
print(List1, List2, List3, sep="\n")

[1, 2, 3, 4, 5, 6, 7, 8, 9]
[11, 12, 13, 14, 15, 16, 17, 18, 19]
[1, 2, 3, 4, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19]

Array Addition¶

Array1 = np.array(List1)
print(Array1)



Array2 = np.array(List2)
print(Array2)



Array3 = Array1 + Array2

print(Array3)

[1 2 3 4 5 6 7 8 9]
[11 12 13 14 15 16 17 18 19]
[12 14 16 18 20 22 24 26 28]

Array Dimension¶

print(Array1.ndim)

1

Array Shape¶

print(Array1.shape)

(9,)

Array Item Size¶

print(Array1.itemsize)

8

Array Data Type¶

Array1.dtype

dtype('int64')

Array Reshape¶

# Start from a flat array holding the integers 1 through 15.
print("\n Create Array of 15 items \n")
Array4 = np.arange(1, 16)
print(Array4)
print("Dimension of Array: ", Array4.ndim)
print("Shape of the Array")
print(Array4.shape)

# Lay the same 15 values out as 3 rows by 5 columns.
print("\n Reshape Array")
Array5 = np.reshape(Array4, (3, 5))
print(Array5)
print("\n Modified Shape of the Array \n")
print(Array5.shape)
print("\n New Dimension of Array is ", Array5.ndim)

 Create Array of 15 items 

[ 1  2  3  4  5  6  7  8  9 10 11 12 13 14 15]
Dimension of Array:  1
Shape of the Array
(15,)

 Reshape Array
[[ 1  2  3  4  5]
 [ 6  7  8  9 10]
 [11 12 13 14 15]]

 Modified Shape of the Array 

(3, 5)

 New Dimension of Array is  2

Transpose of Array¶

Array5

array([[ 1,  2,  3,  4,  5],
       [ 6,  7,  8,  9, 10],
       [11, 12, 13, 14, 15]])

Array6 = Array5.T
Array6

array([[ 1,  6, 11],
       [ 2,  7, 12],
       [ 3,  8, 13],
       [ 4,  9, 14],
       [ 5, 10, 15]])

Subscripting of Array¶

# First row of array5 

Array5[0]

array([1, 2, 3, 4, 5])

# First column of array5 

Array5[:,0]

array([ 1,  6, 11])

# Second row and second column of array5 

Array5[1:2,1:2]

array([[7]])

# Second and third rows, third and fourth columns

print(Array5[1:, 2:4])

[[ 8  9]
 [13 14]]

# Alternate Rows and Alternate Columns

print("\n Alternate Rows \n ")

print(Array5[::2, :])

print("\nAlternate Columns \n")

print(Array5[:, ::2])

 Alternate Rows 
 
[[ 1  2  3  4  5]
 [11 12 13 14 15]]

Alternate Columns 

[[ 1  3  5]
 [ 6  8 10]
 [11 13 15]]

#dir(Array5)

Array5.sum()

120

Array5.max()

15

Array5.min()

1

Array5.mean()

8.0

Array5.std()

4.320493798938574

print("Change Array Type to float32 ")

Array7 = Array5.astype('float32')
print(Array7)

print("\n Array Data Type :")
print(Array7.dtype)

Change Array Type to float32 
[[ 1.  2.  3.  4.  5.]
 [ 6.  7.  8.  9. 10.]
 [11. 12. 13. 14. 15.]]

 Array Data Type :
float32

Matrix using Array¶

A matrix is a two-dimensional array.

Mat1 = np.matrix(Array1)

print(Mat1)

print(Mat1.ndim)

[[1 2 3 4 5 6 7 8 9]]
2

Mat2 = np.matrix(Array5)

print(Mat2)

print(Mat2.ndim)

[[ 1  2  3  4  5]
 [ 6  7  8  9 10]
 [11 12 13 14 15]]
2

# Transpose of Matrix 

Mat3 = Mat2.T
print(Mat3)

[[ 1  6 11]
 [ 2  7 12]
 [ 3  8 13]
 [ 4  9 14]
 [ 5 10 15]]

# Inverse of Matrix: Mat2 is 3x5 (not square), so .I returns the Moore-Penrose pseudo-inverse

Mat5 = Mat2.I
print(Mat5)

[[-2.46666667e-01 -6.66666667e-02  1.13333333e-01]
 [-1.33333333e-01 -3.33333333e-02  6.66666667e-02]
 [-2.00000000e-02 -2.51534904e-17  2.00000000e-02]
 [ 9.33333333e-02  3.33333333e-02 -2.66666667e-02]
 [ 2.06666667e-01  6.66666667e-02 -7.33333333e-02]]

Pandas¶

1. Pandas is a software library written for the Python programming language for data manipulation and analysis.
2. DataFrame object for data manipulation with integrated indexing.
3. Tools for reading and writing data between in-memory data structures and different file formats.
4. Data alignment and integrated handling of missing data.
5. Reshaping and pivoting of data sets.
6. Label-based slicing, fancy indexing, and subsetting of large data sets.
7. Data structure column insertion and deletion.
8. Group by engine allowing split-apply-combine operations on data sets.
9. Data set merging and joining.
10. Hierarchical axis indexing to work with high-dimensional data in a lower-dimensional data structure.
11. Time series-functionality: Date range generation and frequency conversion, moving window statistics, moving window linear regressions, date shifting and lagging.
12. Provides data filtration.

import pandas as pd

# Parallel lists: the salary at position i belongs to the name at position i.
EmpName = [
    "Amit", "Amar", "Akabar", "Anthony",
    "Isha", "Disha", "Hema",
]
Salary = [
    200000, 300000, 400000, 500000,
    250000, 350000, 100000,
]

# Wrap each list in a Series (default integer index) and display it.
print("\n Employee Name Series \n")
Series1 = pd.Series(data=EmpName)
print(Series1)

print("\n Employee Salary Series \n ")
Series2 = pd.Series(data=Salary)
print(Series2)

 Employee Name Series 

0       Amit
1       Amar
2     Akabar
3    Anthony
4       Isha
5      Disha
6       Hema
dtype: object

 Employee Salary Series 
 
0    200000
1    300000
2    400000
3    500000
4    250000
5    350000
6    100000
dtype: int64

#dir(pd.Series)

EmpDict = dict(zip(EmpName, Salary))
print(EmpDict)

{'Amit': 200000, 'Amar': 300000, 'Akabar': 400000, 'Anthony': 500000, 'Isha': 250000, 'Disha': 350000, 'Hema': 100000}

EmpSeries = pd.Series(EmpDict)

print(EmpSeries)

Amit       200000
Amar       300000
Akabar     400000
Anthony    500000
Isha       250000
Disha      350000
Hema       100000
dtype: int64

EmpSeries.index

Index(['Amit', 'Amar', 'Akabar', 'Anthony', 'Isha', 'Disha', 'Hema'], dtype='object')

EmpSeries.values

array([200000, 300000, 400000, 500000, 250000, 350000, 100000])

EmpSeries.keys()

Index(['Amit', 'Amar', 'Akabar', 'Anthony', 'Isha', 'Disha', 'Hema'], dtype='object')

EmpSeries.value_counts()

300000    1
100000    1
350000    1
500000    1
250000    1
400000    1
200000    1
dtype: int64

EmpSeries['Amit']

200000

EmpSeries['Amit'] = 300000

EmpSeries

Amit       300000
Amar       300000
Akabar     400000
Anthony    500000
Isha       250000
Disha      350000
Hema       100000
dtype: int64

EmpSeries.ndim

1

EmpSeries.shape

(7,)

EmpSeries.max()

500000

EmpSeries.mean()

314285.71428571426

EmpSeries.min()

100000

EmpSeries.sum()

2200000

EmpSeries.dtype

dtype('int64')

EmpSeries.dtypes

dtype('int64')

EmpSeries[:3]

Amit      300000
Amar      300000
Akabar    400000
dtype: int64

EmpSeries[2:]

Akabar     400000
Anthony    500000
Isha       250000
Disha      350000
Hema       100000
dtype: int64

Pandas DataFrame¶

df = pd.DataFrame(EmpSeries)

df.columns

RangeIndex(start=0, stop=1, step=1)

df.index

Index(['Amit', 'Amar', 'Akabar', 'Anthony', 'Isha', 'Disha', 'Hema'], dtype='object')

df.ndim

2

df.dtypes

0    int64
dtype: object

df.shape

(7, 1)

df.columns=['Salary']

df

df['Salary']

Amit       300000
Amar       300000
Akabar     400000
Anthony    500000
Isha       250000
Disha      350000
Hema       100000
Name: Salary, dtype: int64

df['Salary'].max()

500000

df['Salary'].mean()

314285.71428571426

df['Salary'].sum()

2200000

df.describe()

df.Salary

Amit       300000
Amar       300000
Akabar     400000
Anthony    500000
Isha       250000
Disha      350000
Hema       100000
Name: Salary, dtype: int64

df.Salary.plot()

<matplotlib.axes._subplots.AxesSubplot at 0x126eefa50>

df.info()

<class 'pandas.core.frame.DataFrame'>
Index: 7 entries, Amit to Hema
Data columns (total 1 columns):
Salary    7 non-null int64
dtypes: int64(1)
memory usage: 432.0+ bytes

df1 = pd.DataFrame(zip(EmpName,Salary))
print(df1)

         0       1
0     Amit  200000
1     Amar  300000
2   Akabar  400000
3  Anthony  500000
4     Isha  250000
5    Disha  350000
6     Hema  100000

df1.columns

RangeIndex(start=0, stop=2, step=1)

df1.columns = ['EmpName', 'EmpSalary']

df1

df1.shape

(7, 2)

df1.index

RangeIndex(start=0, stop=7, step=1)

df1.describe()

df1.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 7 entries, 0 to 6
Data columns (total 2 columns):
EmpName      7 non-null object
EmpSalary    7 non-null int64
dtypes: int64(1), object(1)
memory usage: 240.0+ bytes

df1.to_csv('EmpData.csv',index=False)

cat EmpData.csv

EmpName,EmpSalary
Amit,200000
Amar,300000
Akabar,400000
Anthony,500000
Isha,250000
Disha,350000
Hema,100000

pwd

'/Users/surendra'

# Read back the CSV produced by df1.to_csv('EmpData.csv', ...). The file name
# must match that spelling exactly: a differently-cased name only resolves on
# case-insensitive filesystems. A path relative to the working directory is
# used so the cell does not depend on one user's home directory.
path = 'EmpData.csv'

df2 = pd.read_csv(path)
df2

df2['EmpName']

0       Amit
1       Amar
2     Akabar
3    Anthony
4       Isha
5      Disha
6       Hema
Name: EmpName, dtype: object

df2['EmpSalary']

0    200000
1    300000
2    400000
3    500000
4    250000
5    350000
6    100000
Name: EmpSalary, dtype: int64

df2.iloc[:3]

df2.iloc[0:5]

df2[:2]

df2.EmpName

0       Amit
1       Amar
2     Akabar
3    Anthony
4       Isha
5      Disha
6       Hema
Name: EmpName, dtype: object

df2.head()

df2.tail()

df2.sort_values('EmpSalary')

df2.sort_values('EmpName', ascending = False )

df2.plot(kind = 'bar')

<matplotlib.axes._subplots.AxesSubplot at 0x12b86bed0>

df2.plot(kind = 'line')

<matplotlib.axes._subplots.AxesSubplot at 0x12b691510>

df2.plot.hist()

<matplotlib.axes._subplots.AxesSubplot at 0x12b5f0750>

df2.plot(kind = 'barh')

<matplotlib.axes._subplots.AxesSubplot at 0x12b748ed0>

df2.plot(kind = 'pie',x='EmpName',y='EmpSalary', figsize = (7,5),use_index = True)

<matplotlib.axes._subplots.AxesSubplot at 0x12d253e90>

df2.plot(kind = 'area',x='EmpName',y='EmpSalary', use_index=True, figsize = (8,8))

<matplotlib.axes._subplots.AxesSubplot at 0x12cf4bd90>

df2.plot(kind = 'hist',x='EmpName',y='EmpSalary', figsize = (8,5))

<matplotlib.axes._subplots.AxesSubplot at 0x12c958510>

df2.plot(kind = 'box',x='EmpName',y='EmpSalary', figsize = (8,8))

<matplotlib.axes._subplots.AxesSubplot at 0x12bd8a050>

	Salary
count	7.000000
mean	314285.714286
std	124880.895638
min	100000.000000
25%	275000.000000
50%	300000.000000
75%	375000.000000
max	500000.000000

	EmpSalary
count	7.000000
mean	300000.000000
std	132287.565553
min	100000.000000
25%	225000.000000
50%	300000.000000
75%	375000.000000
max	500000.000000

	Salary
Amit	300000
Amar	300000
Akabar	400000
Anthony	500000
Isha	250000
Disha	350000
Hema	100000

	EmpName	EmpSalary
0	Amit	200000
1	Amar	300000
2	Akabar	400000
3	Anthony	500000
4	Isha	250000
5	Disha	350000
6	Hema	100000