import sys              #only needed to determine Python version number
print('Python version ' + sys.version)

Python version 3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]


!python --version

Python 3.10.12


print("Hello, world!")

Hello, world!


#Python help - This can be done on a (I)Python console
help(len)
?len

Help on built-in function len in module builtins:

len(obj, /)
    Return the number of items in a container.


x=10
y = 5
x+y

15


# Python program explaining
# log() function
import numpy as np
out = np.log(10)
print (round(out,6))

2.302585


# importing "math" for mathematical operations
import math


# Printing the log base 10 of 10
print ("Logarithm base 10 of 10 is : ", end="")
print (math.log10(10))

Logarithm base 10 of 10 is : 1.0


exponent =5
out = math.exp(exponent)
print (round(out,4))

148.4132


# Python code to demonstrate the working of cos()
x=10
out=math.cos(x)
print (round(out,6))

-0.839072


x==y

False

x>y

True


# Python lists
a=[4,5,1,3,4,5]
print(a[2])
print(a[2:5])
print(type(a))
# Length of a
print(len(a))

1
[1, 3, 4]
<class 'list'>
6


xs = [3, 1, 2]   # Create a list
print(xs, xs[2])  # Prints "[3, 1, 2] 2"
print(xs[-1])     # Negative indices count from the end of the list; prints "2"

[3, 1, 2] 2
2


xs[2] = 'foo'    # Lists can contain elements of different types
print(xs)         # Prints "[3, 1, 'foo']"

[3, 1, 'foo']


xs.append('bar') # Add a new element to the end of the list
print(xs)   # Prints "[3, 1, 'foo', 'bar']"

[3, 1, 'foo', 'bar']


x = xs.pop()     # Remove and return the last element of the list
print(x, xs)      # Prints "bar [3, 1, 'foo']"

bar [3, 1, 'foo']


nums = list(range(5))     # range is a built-in function that creates a list of integers
print(nums)               # Prints "[0, 1, 2, 3, 4]"
print(nums[2:4])          # Get a slice from index 2 to 4 (exclusive); prints "[2, 3]"
print(nums[2:])           # Get a slice from index 2 to the end; prints "[2, 3, 4]"
print(nums[:2])           # Get a slice from the start to index 2 (exclusive); prints "[0, 1]"
print(nums[:])            # Get a slice of the whole list; prints "[0, 1, 2, 3, 4]"
print(nums[:-1])          # Slice indices can be negative; prints "[0, 1, 2, 3]"
nums[2:4] = [8, 9]        # Assign a new sublist to a slice
print(nums)

[0, 1, 2, 3, 4]
[2, 3]
[2, 3, 4]
[0, 1]
[0, 1, 2, 3, 4]
[0, 1, 2, 3]
[0, 1, 8, 9, 4]


import numpy as np
a =[5,2,3,1,7]
b =[1,5,4,6,8]
a=np.array(a)
b=np.array(b)
#Element wise addition
print(a+b)
#Element wise subtraction
print(a-b)
#Element wise product
print(a*b)
# Exponentiating the elements of a list
print(a**2)

[ 6  7  7  7 15]
[ 4 -3 -1 -5 -1]
[ 5 10 12  6 56]
[25  4  9  1 49]


#Python
import sklearn as sklearn
import pandas as pd
from sklearn import datasets
# This creates a Sklearn bunch
data = datasets.load_iris()
# Convert to Pandas dataframe
iris = pd.DataFrame(data.data, columns=data.feature_names)
iris


#Python - size
import sklearn as sklearn
import pandas as pd
from sklearn import datasets
data = datasets.load_iris()
# Convert to Pandas dataframe
iris = pd.DataFrame(data.data, columns=data.feature_names)
iris.shape

(150, 4)


#Python
data = datasets.load_iris()
# Convert to Pandas dataframe
iris = pd.DataFrame(data.data, columns=data.feature_names)
print(iris.head(5))
print(iris.tail(5))

   sepal length (cm)  sepal width (cm)  petal length (cm)  petal width (cm)
0                5.1               3.5                1.4               0.2
1                4.9               3.0                1.4               0.2
2                4.7               3.2                1.3               0.2
3                4.6               3.1                1.5               0.2
4                5.0               3.6                1.4               0.2
     sepal length (cm)  sepal width (cm)  petal length (cm)  petal width (cm)
145                6.7               3.0                5.2               2.3
146                6.3               2.5                5.0               1.9
147                6.5               3.0                5.2               2.0
148                6.2               3.4                5.4               2.3
149                5.9               3.0                5.1               1.8


#Python
data = datasets.load_iris()
# Convert to Pandas dataframe
iris = pd.DataFrame(data.data, columns=data.feature_names)
print(iris.info())

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 150 entries, 0 to 149
Data columns (total 4 columns):
 #   Column             Non-Null Count  Dtype  
---  ------             --------------  -----  
 0   sepal length (cm)  150 non-null    float64
 1   sepal width (cm)   150 non-null    float64
 2   petal length (cm)  150 non-null    float64
 3   petal width (cm)   150 non-null    float64
dtypes: float64(4)
memory usage: 4.8 KB
None


#Python
data = datasets.load_iris()
# Convert to Pandas dataframe
iris = pd.DataFrame(data.data, columns=data.feature_names)
#Get column names
print(iris.columns)
## Index(['sepal length

Index(['sepal length (cm)', 'sepal width (cm)', 'petal length (cm)',
       'petal width (cm)'],
      dtype='object')


#Python
data = datasets.load_iris()
# Convert to Pandas dataframe
iris = pd.DataFrame(data.data, columns=data.feature_names)
iris.columns = ["lengthOfSepal","widthOfSepal","lengthOfPetal","widthOfPetal"]
print(iris.columns)

Index(['lengthOfSepal', 'widthOfSepal', 'lengthOfPetal', 'widthOfPetal'], dtype='object')


#Python
data = datasets.load_iris()
# Convert to Pandas dataframe
iris = pd.DataFrame(data.data, columns=data.feature_names)
print(iris.info())

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 150 entries, 0 to 149
Data columns (total 4 columns):
 #   Column             Non-Null Count  Dtype  
---  ------             --------------  -----  
 0   sepal length (cm)  150 non-null    float64
 1   sepal width (cm)   150 non-null    float64
 2   petal length (cm)  150 non-null    float64
 3   petal width (cm)   150 non-null    float64
dtypes: float64(4)
memory usage: 4.8 KB
None


#Python
# To select an entire row we use .iloc. The index can be used with the ':'. If
# .iloc[start row: end row]. If start row is omitted then it implies the beginning of
# data frame, if end row is omitted then it implies all rows till end
#Python
data = datasets.load_iris()
# Convert to Pandas dataframe
iris = pd.DataFrame(data.data, columns=data.feature_names)
print(iris.iloc[3])
print(iris[:5])
# In python we can select columns by column name as follows
print(iris['sepal length (cm)'][2:6])
#If you want to select more than 2 columns then you must use the double '[[]]' since the
# index is a list itself
print(iris[['sepal length (cm)','sepal width (cm)']][4:7])

sepal length (cm)    4.6
sepal width (cm)     3.1
petal length (cm)    1.5
petal width (cm)     0.2
Name: 3, dtype: float64
   sepal length (cm)  sepal width (cm)  petal length (cm)  petal width (cm)
0                5.1               3.5                1.4               0.2
1                4.9               3.0                1.4               0.2
2                4.7               3.2                1.3               0.2
3                4.6               3.1                1.5               0.2
4                5.0               3.6                1.4               0.2
2    4.7
3    4.6
4    5.0
5    5.4
Name: sepal length (cm), dtype: float64
   sepal length (cm)  sepal width (cm)
4                5.0               3.6
5                5.4               3.9
6                4.6               3.4


#Python
data = datasets.load_iris()
# Convert to Pandas dataframe
iris = pd.DataFrame(data.data, columns=data.feature_names)
print(round(iris['sepal length (cm)'].mean(),2)) #Mean
print(round(iris['sepal width (cm)'].std(),2))#Standard deviation
print(round(iris['sepal length (cm)'].max(),2))
print(round(iris['sepal length (cm)'].min(),2))
print(round(iris['sepal length (cm)'].median(),2))

5.84
0.44
7.9
4.3
5.8


# Upload local file to Colab notebook
from google.colab import files
import pandas as pd
uploaded = files.upload()

Saving cars.csv to cars.csv


# Plot the points using matplotlib
# If you don't use Colab, you can read using read_csv() from Pandas
import matplotlib.pyplot as plt
import io
cars= pd.read_csv(io.BytesIO(uploaded['cars.csv']))
plt.scatter(cars['speed'],cars['dist'])
plt.title('Scatter plot')
plt.xlabel('speed')
plt.ylabel('distance')
plt.show()


# Python: random seed; use rondom function.
# If the replication needs, it's better to read in the data
import random
random.seed(1234)


# call scipy.stats library
# import binom distribution
# round 5 decimals
from scipy.stats import binom,norm
x, n, p=4,10,0.5
round(binom.pmf(x, n, p),5)

0.20508


round(norm.cdf(1.86),5)

0.96856


round(norm.ppf(0.975),5)

1.95996


norm.rvs(size=10)

array([ 1.03133057,  0.9641532 , -1.14807617, -0.90139219,  1.53622188,
       -0.5087218 ,  2.32006624,  0.27640445, -0.67003179, -1.0523237 ])


# generate random numbers from N(100,20)
# The location (loc) keyword specifies the mean. The scale (scale) keyword specifies the standard deviation.
data_normal= norm.rvs(size=10,loc=100,scale=20)


%%shell
jupyter nbconvert --to html ///content/1A.Introduction_to_Python.ipynb

Introduction to Python¶

1. Introduction to Python¶

2. Preparations¶

3. Fundamentals¶

Colab Notebook Open in Colab¶

1. Introduction to Python¶

1.1 Powerful Statistical language: Python¶

1.2 Colab and Jupyter Notebooks¶

2. Preparations¶

3. Fundamentals¶

3.1 Before Coding¶

3.2 Use Python as Calculator¶

3.3 Data Structure: List and Data frame¶

3.3.1 List¶

3.3.2 Data frames¶

3.4 Basic Plotting¶

3.5 Probability Distributions¶

	sepal length (cm)	sepal width (cm)	petal length (cm)	petal width (cm)
0	5.1	3.5	1.4	0.2
1	4.9	3.0	1.4	0.2
2	4.7	3.2	1.3	0.2
3	4.6	3.1	1.5	0.2
4	5.0	3.6	1.4	0.2
...	...	...	...	...
145	6.7	3.0	5.2	2.3
146	6.3	2.5	5.0	1.9
147	6.5	3.0	5.2	2.0
148	6.2	3.4	5.4	2.3
149	5.9	3.0	5.1	1.8

	sepal length (cm)	sepal width (cm)	petal length (cm)	petal width (cm)
0	5.1	3.5	1.4	0.2
1	4.9	3.0	1.4	0.2
2	4.7	3.2	1.3	0.2
3	4.6	3.1	1.5	0.2
4	5.0	3.6	1.4	0.2
...	...	...	...	...
145	6.7	3.0	5.2	2.3
146	6.3	2.5	5.0	1.9
147	6.5	3.0	5.2	2.0
148	6.2	3.4	5.4	2.3
149	5.9	3.0	5.1	1.8

	sepal length (cm)	sepal width (cm)	petal length (cm)	petal width (cm)
0	5.1	3.5	1.4	0.2
1	4.9	3.0	1.4	0.2
2	4.7	3.2	1.3	0.2
3	4.6	3.1	1.5	0.2
4	5.0	3.6	1.4	0.2
...	...	...	...	...
145	6.7	3.0	5.2	2.3
146	6.3	2.5	5.0	1.9
147	6.5	3.0	5.2	2.0
148	6.2	3.4	5.4	2.3
149	5.9	3.0	5.1	1.8