# Creating lists: first an empty one, then one holding values of mixed types.
my_list = []  # create an empty list
print(my_list)
my_list = [1, 2, 3, 'example', 3.132]  # rebind the name to a list holding ints, a str and a float
print(my_list)

[]
[1, 2, 3, 'example', 3.132]


# Three ways to add to a list; each print shows the list after the step above it.
my_list = [1, 2, 3]
print(my_list)
my_list.append([555, 12])  # append() adds its argument as ONE element (a nested list here)
print(my_list)
my_list.extend([234, 'more_example'])  # extend() adds each item of the iterable separately
print(my_list)
my_list.insert(1, 'insert_example')  # insert(i, x) puts x at index i, shifting later items right
print(my_list)

[1, 2, 3]
[1, 2, 3, [555, 12]]
[1, 2, 3, [555, 12], 234, 'more_example']
[1, 'insert_example', 2, 3, [555, 12], 234, 'more_example']


# Four ways to remove items from a list.
my_list = [1, 2, 3, 'example', 3.132, 10, 30]
del my_list[5]  # delete the element at index 5 (the value 10)
print(my_list)
my_list.remove('example')  # remove the first element equal to 'example'
print(my_list)
a = my_list.pop(1)  # pop(i) removes the element at index i and returns it
print('Popped Element: ', a, ' List remaining: ', my_list)
my_list.clear()  # empty the list in place
print(my_list)

[1, 2, 3, 'example', 3.132, 30]
[1, 2, 3, 3.132, 30]
Popped Element:  2  List remaining:  [1, 3, 3.132, 30]
[]


# Reading from a list: iteration, indexing and slicing.
my_list = [1, 2, 3, 'example', 3.132, 10, 30]
for element in my_list:  # visit the elements one by one, in order
    print(element)
print(my_list)  # the whole list
print(my_list[3])  # the element at index 3 (indices start at 0)
print(my_list[0:2])  # slice: indices 0 and 1; the stop index 2 is excluded
print(my_list[::-1])  # a step of -1 yields the elements in reverse order

1
2
3
example
3.132
10
30
[1, 2, 3, 'example', 3.132, 10, 30]
example
[1, 2]
[30, 10, 3.132, 'example', 3, 2, 1]


# Common list helpers.
my_list = [1, 2, 3, 10, 30, 10]
print(len(my_list))  # number of elements
print(my_list.index(10))  # index of the FIRST occurrence of 10
print(my_list.count(10))  # how many times 10 occurs
print(sorted(my_list))  # sorted() returns a new sorted list; my_list is unchanged
my_list.sort(reverse=True)  # sort() reorders my_list itself, here in descending order
print(my_list)

6
3
2
[1, 2, 3, 10, 10, 30]
[30, 10, 10, 3, 2, 1]


# Creating dictionaries: an empty one, then one mapping int keys to str values.
my_dict = {}  # empty dictionary
print(my_dict)
my_dict = {1: 'Python', 2: 'Java'}  # dictionary with two key-value pairs
print(my_dict)

{}
{1: 'Python', 2: 'Java'}


# Assigning to a key either overwrites its value or creates the pair.
my_dict = {'First': 'Python', 'Second': 'Java'}
print(my_dict)
my_dict['Second'] = 'C++'  # the key exists: its value is replaced
print(my_dict)
my_dict['Third'] = 'Ruby'  # the key is new: the key-value pair is added
print(my_dict)

{'First': 'Python', 'Second': 'Java'}
{'First': 'Python', 'Second': 'C++'}
{'First': 'Python', 'Second': 'C++', 'Third': 'Ruby'}


# Removing entries from a dictionary.
my_dict = {'First': 'Python', 'Second': 'Java', 'Third': 'Ruby'}
a = my_dict.pop('Third')  # pop(key) removes the key and returns its value
print('Value:', a)
print('Dictionary:', my_dict)
b = my_dict.popitem()  # popitem() removes the last-inserted pair and returns it as a (key, value) tuple
print('Key, value pair:', b)
print('Dictionary', my_dict)
my_dict.clear()  # empty the dictionary in place
# NOTE(review): the 'n' label below looks like a lost '\n' escape - confirm the intent.
print('n', my_dict)

Value: Ruby
Dictionary: {'First': 'Python', 'Second': 'Java'}
Key, value pair: ('Second', 'Java')
Dictionary {'First': 'Python'}
n {}


# Two ways to look up a value by its key.
my_dict = {'First': 'Python', 'Second': 'Java'}
print(my_dict['First'])  # subscript access; a missing key would raise KeyError
print(my_dict.get('Second'))  # get() access; a missing key would return None instead

Python
Java


# Dictionary views and lookup.
my_dict = {'First': 'Python', 'Second': 'Java', 'Third': 'Ruby'}
print(my_dict.keys())  # view of the keys
print(my_dict.values())  # view of the values
print(my_dict.items())  # view of the (key, value) pairs
print(my_dict.get('First'))  # the value stored under 'First'

dict_keys(['First', 'Second', 'Third'])
dict_values(['Python', 'Java', 'Ruby'])
dict_items([('First', 'Python'), ('Second', 'Java'), ('Third', 'Ruby')])
Python


my_tuple = (1, 2, 3)  # create a tuple from a parenthesised, comma-separated literal
print(my_tuple)

(1, 2, 3)


# Tuples are read like lists: iteration, indexing and slicing.
my_tuple2 = (1, 2, 3, 'edureka')
for x in my_tuple2:  # visit the elements one by one
    print(x)
print(my_tuple2)  # the whole tuple
print(my_tuple2[0])  # the first element
print(my_tuple2[:])  # a full slice: every element
print(my_tuple2[3][4])  # chained indexing: character 4 of the string stored at index 3

1
2
3
edureka
(1, 2, 3, 'edureka')
1
(1, 2, 3, 'edureka')
e


# A tuple cannot grow in place: "adding" elements concatenates two tuples
# into a new one and rebinds the name to the result.
my_tuple = (1, 2, 3)
my_tuple += (4, 5, 6)
print(my_tuple)

(1, 2, 3, 4, 5, 6)


# A tuple's slots are fixed, but a mutable object stored in one can still change.
my_tuple = (1, 2, 3, ['hindi', 'python'])
my_tuple[3][0] = 'english'  # mutates the inner list, not the tuple itself
print(my_tuple)
print(my_tuple.count(2))  # number of elements equal to 2
print(my_tuple.index(['english', 'python']))  # index of the first element equal to this list

(1, 2, 3, ['english', 'python'])
1
3


my_set = {1, 2, 3, 4, 5, 5, 5}  # create a set; the repeated 5s collapse into a single element
print(my_set)

{1, 2, 3, 4, 5}


my_set = {1, 2, 3}
my_set.add(4)  # add a single element to the set
print(my_set)

{1, 2, 3, 4}


# Each set operation is shown twice: the method form, then the equivalent operator.
my_set = {1, 2, 3, 4}
my_set_2 = {3, 4, 5, 6}
print(my_set.union(my_set_2), '----------', my_set | my_set_2)  # elements in either set
print(my_set.intersection(my_set_2), '----------', my_set & my_set_2)  # elements in both sets
print(my_set.difference(my_set_2), '----------', my_set - my_set_2)  # in my_set but not in my_set_2
print(my_set.symmetric_difference(my_set_2), '----------', my_set ^ my_set_2)  # in exactly one of the two
my_set.clear()  # empty the set in place
print(my_set)  # an empty set prints as set()

{1, 2, 3, 4, 5, 6} ---------- {1, 2, 3, 4, 5, 6}
{3, 4} ---------- {3, 4}
{1, 2} ---------- {1, 2}
{1, 2, 5, 6} ---------- {1, 2, 5, 6}
set()


import numpy as np
 
# creating list
# (named sample_list rather than `list`, so the built-in list type is not
# shadowed for the rest of the session)
sample_list = [1, 2, 3, 4]

# creating numpy array: np.array copies the list's values into a 1-D array
sample_array = np.array(sample_list)
print("List in python : ", sample_list)
print("Numpy Array in python :",
      sample_array)

List in python :  [1, 2, 3, 4]
Numpy Array in python : [1 2 3 4]


# importing numpy module
import numpy as np
 
# Three equal-length rows; np.array stacks them into a 2-D array.
list_1, list_2, list_3 = [1, 2, 3, 4], [5, 6, 7, 8], [9, 10, 11, 12]

# Build the array from the list of rows.
sample_array = np.array([list_1, list_2, list_3])

print("Numpy multi dimensional array in python\n", sample_array)

Numpy multi dimensional array in python
 [[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]


# importing numpy module
import numpy as np
 
# Rows of the first array: 3 rows of 4 values each.
list_1 = [1, 2, 3, 4]
list_2 = [5, 6, 7, 8]
list_3 = [9, 10, 11, 12]
sample_array = np.array((list_1, list_2, list_3))

print("Numpy array :")
print(sample_array)

# .shape is a tuple with the length of each axis: (rows, columns) here.
print("Shape of the array :", sample_array.shape)

# A second array written directly as nested lists: 5 rows of 3 values each.
sample_array2 = np.array([
    [0, 4, 2],
    [3, 4, 5],
    [23, 4, 5],
    [2, 34, 5],
    [5, 6, 7],
])

print(sample_array2)
print("shape of the array :", sample_array2.shape)

Numpy array :
[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]
Shape of the array : (3, 4)
[[ 0  4  2]
 [ 3  4  5]
 [23  4  5]
 [ 2 34  5]
 [ 5  6  7]]
shape of the array : (5, 3)


# Import module
import numpy as np
 
# NumPy infers the element type from the values: an integer type here ...
sample_array_1 = np.array([[0, 4, 2]])
# ... and a floating-point type here.
sample_array_2 = np.array([0.2, 0.4, 2.4])

# .dtype reports the element type each array ended up with.
print("Data type of the array 1 :", sample_array_1.dtype)
print("Data type of array 2 :", sample_array_2.dtype)

Data type of the array 1 : int64
Data type of array 2 : float64


# import module
import numpy as np
 
# Create a 1-D array from a list of ints.
arr = np.array([3, 4, 5, 5])
print("Array :", arr)

Array : [3 4 5 5]


#Import numpy module
import numpy as np
 
# A lazy generator of the squares 0, 1, 4, ..., 49.
iterable = (n ** 2 for n in range(8))
# fromiter() consumes the iterable and stores every item as a float.
arr = np.fromiter(iterable, dtype=float)
print("fromiter() array :", arr)

fromiter() array : [ 0.  1.  4.  9. 16. 25. 36. 49.]


import numpy as np
# A str iterates over its characters, so fromiter() yields one element per character.
var = "Geekforgeeks"
arr = np.fromiter(var, dtype='U2')  # 'U2': unicode strings of at most 2 characters
print("fromiter() array :", arr)

fromiter() array : ['G' 'e' 'e' 'k' 'f' 'o' 'r' 'g' 'e' 'e' 'k' 's']


import numpy as np
# arange(start, stop, step): 1, 3, 5, ... up to but not including 20, as 32-bit floats.
print(np.arange(1, 20, 2, dtype=np.float32))

[ 1.  3.  5.  7.  9. 11. 13. 15. 17. 19.]


import numpy as np
# linspace(start, stop, num): 3 evenly spaced values from 3.5 to 10, both ends included.
print(np.linspace(3.5, 10, num=3))

[ 3.5   6.75 10.  ]


import numpy as np
# empty() only allocates the 4x3 array; its contents are whatever was already in
# memory, so the printed numbers are arbitrary and can differ from run to run.
print(np.empty((4, 3), dtype=np.int32, order='f'))

[[4 4 4]
 [0 0 0]
 [4 4 4]
 [0 0 0]]


import numpy as np
# A 4x3 array of 32-bit ints, every element 1, stored in column-major ('f') order.
print(np.ones((4, 3), dtype=np.int32, order='f'))

[[1 1 1]
 [1 1 1]
 [1 1 1]
 [1 1 1]]


import numpy as np
# A 4x3 array of 32-bit ints, every element 0, stored in column-major ('f') order.
print(np.zeros((4, 3), dtype=np.int32, order='f'))

[[0 0 0]
 [0 0 0]
 [0 0 0]
 [0 0 0]]


# import the pandas library
import pandas as pd
# Column-oriented data: each key is a column name, each value that column's entries.
data = {
    'Name': ['Ashika', 'Tanu', 'Ashwin', 'Mohit', 'Sourabh'],
    'Age': [24, 23, 22, 19, 10],
}
data

{'Name': ['Ashika', 'Tanu', 'Ashwin', 'Mohit', 'Sourabh'],
 'Age': [24, 23, 22, 19, 10]}


# Build a DataFrame by passing the dictionary (data) to the pandas DataFrame constructor;
# the dictionary keys become the column names
df = pd.DataFrame(data)
df


# import the pandas library
import pandas as pd
# Column-oriented data: each key is a column name, each value that column's entries.
data = {
    'Name': ['Ashika', 'Tanu', 'Ashwin', 'Mohit', 'Sourabh'],
    'Age': [24, 23, 22, 19, 10],
}
# Build the DataFrame from the dictionary.
df = pd.DataFrame(data)
# Indexing with a LIST of column names returns a DataFrame (here with one column).
df[['Name']]


# import the pandas library
import pandas as pd
# Column-oriented data: each key is a column name, each value that column's entries.
data = {
    'Name': ['Ashika', 'Tanu', 'Ashwin', 'Mohit', 'Sourabh'],
    'Age': [24, 23, 22, 19, 10],
}
# Build the DataFrame from the dictionary.
df = pd.DataFrame(data)
# .loc selects by index LABEL; label 1 is the second row ('Tanu', 23).
row = df.loc[1]
row

Name    Tanu
Age       23
Name: 1, dtype: object


# .iloc selects by integer POSITION: row 1, every column (:)
row = df.iloc[1, :]
row

Name    Tanu
Age       23
Name: 1, dtype: object


# A single cell by position: row 1, column 1
age = df.iloc[1, 1]
age

23


# import the pandas library
import pandas as pd
# Column-oriented data: each key is a column name, each value that column's entries.
data = {
    'Name': ['Ashika', 'Tanu', 'Ashwin', 'Mohit', 'Sourabh'],
    'Age': [24, 23, 22, 19, 10],
}
data

{'Name': ['Ashika', 'Tanu', 'Ashwin', 'Mohit', 'Sourabh'],
 'Age': [24, 23, 22, 19, 10]}


# Build a DataFrame by passing the dictionary (data) to the pandas DataFrame constructor
df = pd.DataFrame(data)
# Selecting one column by name returns it as a Series
df['Age']

0    24
1    23
2    22
3    19
4    10
Name: Age, dtype: int64


# Select rows which have ages > 19: df['Age'] > 19 is a True/False Series,
# and indexing df with it keeps only the rows marked True
df[df['Age'] > 19]


# Remove the 'Age' column from df in place
del df['Age']
df


# Insert a new column called 'name' at column position 1, filled with the values of 'Name'
df.insert(1, 'name', df['Name'])
df


# importing both pandas and numpy libraries
import pandas as pd
import numpy as np

# Two rows of data; np.nan marks the missing entries of the second row.
data = {
    'Name': ['Tanu', np.nan],
    'Age': [23, np.nan],
}
data

{'Name': ['Tanu', nan], 'Age': [23, nan]}


# Build a DataFrame from the dictionary; its np.nan entries are the missing values
df = pd.DataFrame(data)
df


# using the isnull() function: returns a same-shaped frame of booleans,
# True wherever a value is missing
df.isnull()


# fillna(0) returns a new frame with every missing value replaced by 0;
# df itself is not modified because the result is not assigned back
df.fillna(0)


# NOTE(review): this repeats the previous cell verbatim - confirm whether a
# different missing-data call was intended here.
df.fillna(0)


# import the pandas library
import pandas as pd
# Column-oriented data whose column names are oddly cased ('NAMe', 'AGe').
data = {
    'NAMe': ['Ashika', 'Tanu', 'Ashwin', 'Mohit', 'Sourabh'],
    'AGe': [24, 23, 22, 19, 10],
}
data

{'NAMe': ['Ashika', 'Tanu', 'Ashwin', 'Mohit', 'Sourabh'],
 'AGe': [24, 23, 22, 19, 10]}


# Build a DataFrame by passing the dictionary (data) to the pandas DataFrame constructor;
# the dictionary keys become the column names
df = pd.DataFrame(data)
df


# Mapping from each current column name to its replacement
newcols = {
            'NAMe': 'Name',
            'AGe': 'Age'
          }
# Use `rename()` to rename your columns; inplace=True modifies df itself
df.rename(columns=newcols, inplace=True)
df


# The values of new index: maps each current row label to its replacement
newindex = {
            0: 'a',
            1: 'b',
            2: 'c',
            3: 'd',
            4: 'e'
}
# Rename your index. Without inplace=True this returns a renamed frame
# and leaves df's own index unchanged
df.rename(index=newindex)


# import the pandas library
import pandas as pd
# Column-oriented data: each key is a column name, each value that column's entries.
data = {
    'Name': ['Ashika', 'Tanu', 'Ashwin', 'Mohit', 'Sourabh'],
    'Age': [24, 23, 22, 19, 10],
}
df = pd.DataFrame(data)
print(df)

# By default the row index is written too, as an extra unnamed first column.
df.to_csv('myDataFrame.csv')

# index=False leaves the row index out of the file.
df.to_csv('myDataFrame_noidx.csv', index=False)

      Name  Age
0   Ashika   24
1     Tanu   23
2   Ashwin   22
3    Mohit   19
4  Sourabh   10


# read from csv
# header=None treats the file's header line as ordinary data, so the columns are
# numbered 0, 1, 2; nrows=5 reads only the first five lines (header line + four records)
df = pd.read_csv('myDataFrame.csv', header=None, nrows=5)
print(df)

     0       1    2
0  NaN    Name  Age
1  0.0  Ashika   24
2  1.0    Tanu   23
3  2.0  Ashwin   22
4  3.0   Mohit   19


# when header=None, the column names are integer positions (0, 1, ...) and the
# file's own header line ('Name', 'Age') shows up as the first data row
df = pd.read_csv('myDataFrame_noidx.csv', header=None, nrows=5)
print(df)

        0    1
0    Name  Age
1  Ashika   24
2    Tanu   23
3  Ashwin   22
4   Mohit   19


# To use the file's first line as the column names instead of integer positions,
# explicitly set header=0
df = pd.read_csv('myDataFrame_noidx.csv', header=0, nrows=5)
print(df)

      Name  Age
0   Ashika   24
1     Tanu   23
2   Ashwin   22
3    Mohit   19
4  Sourabh   10


import pandas as pd
import numpy as np

# The "Rate" column should be numeric, but one of its entries is the string "A".
data1 = {
    'id': [1, 2, 3, 4, 5],
    'Rate': [5, 9, 3, 'A', 6],
    'Name': ['a', 'b', 'c', 'd', 'e'],
}
df = pd.DataFrame(data1)
print(df)

   id Rate Name
0   1    5    a
1   2    9    b
2   3    3    c
3   4    A    d
4   5    6    e


# errors='coerce' turns values that cannot be parsed as numbers (the 'A') into NaN
# instead of raising; the resulting numeric column is then doubled
df['Rate'] = pd.to_numeric(df['Rate'], errors='coerce') * 2
print(df)

   id  Rate Name
0   1  10.0    a
1   2  18.0    b
2   3   6.0    c
3   4   NaN    d
4   5  12.0    e


import pandas
import scipy
import numpy
from sklearn.preprocessing import MinMaxScaler

# data values: seven samples with two features each
X = [ [110, 200], [120, 800], [310, 400], [140, 900], [510, 200], [653, 400] ,[310, 880] ]

# transform data: fit_transform learns each column's min and max, then rescales that column to feature_range
scaler = MinMaxScaler(feature_range=(0, 1))
rescaledX = scaler.fit_transform(X)

# summarize transformed data
numpy.set_printoptions(precision=2)  # print floats with two decimal places
print(rescaledX[0:6,:])  # the first six of the seven rows, all columns

[[0.   0.  ]
 [0.02 0.86]
 [0.37 0.29]
 [0.06 1.  ]
 [0.74 0.  ]
 [1.   0.29]]

A Tutorial about Python Basics¶

Basic data structures (resource)¶

1) Lists¶

Creating a list¶

Adding elements¶

Deleting Elements¶

Accessing Elements¶

Other Functions¶

2) Dictionaries¶

Creating a Dictionary¶

Changing and Adding key, value pairs¶

Deleting key, value pairs¶

Accessing Elements¶

Other Functions¶

3) Tuples¶

Creating a Tuple¶

Accessing Elements¶

Appending Elements¶

Other Functions¶

4) Sets¶

Creating a set¶

Adding elements¶

Operations in sets¶

Basics of Numpy¶

One Dimensional Array¶

Multi-Dimensional Array¶

Anatomy of an array¶

Data type objects (dtype):¶

Some different ways of creating a NumPy array:¶

Basics of Pandas¶

Basic operations that can be applied to a pandas DataFrame are shown below:¶

Creating a pandas DataFrame¶

Performing operations on Rows and Columns¶

Data Selection, addition, deletion¶

Working with missing data¶

Renaming the Columns or Indices of a DataFrame¶

Read from and write to CSV file¶

Handle numeric exceptions¶

Basic data processing with sklearn¶

Rescale the data¶

	Name	name
0	Ashika	Ashika
1	Tanu	Tanu
2	Ashwin	Ashwin
3	Mohit	Mohit
4	Sourabh	Sourabh

	Name	Age
0	False	False
1	True	True