Location via proxy:   [ UP ]  
[Report a bug]   [Manage cookies]                
0% found this document useful (0 votes)
16 views

Data Loading- Jupyter Notebook

Copyright
© All Rights Reserved
Available Formats
Download as PDF, TXT or read online on Scribd
0% found this document useful (0 votes)
16 views

Data Loading- Jupyter Notebook

Copyright
© All Rights Reserved
Available Formats
Download as PDF, TXT or read online on Scribd
You are on page 1/ 15

2/4/23, 1:43 PM Untitled7 - Jupyter Notebook

In [1]:

import pandas as pd

In [3]:

# Load the workbook data1.xlsx from the author's Desktop into d.
# NOTE(review): absolute, user-specific Windows path; this cell only runs on a
# machine that has this exact folder layout.
d = pd.read_excel("C:\\Users\\Nisha\\OneDrive\\Desktop\\data1.xlsx")

In [4]:

# Bind the loaded data to df, the name every later cell works with.
# NOTE(review): d comes from read_excel and should already be a DataFrame, so
# this wrapper looks redundant; confirm before removing.
df = pd.DataFrame(d)

In [8]:

# Default text view: the middle rows are elided (the ".." row in the output)
# and the columns are wrapped into two blocks (note the trailing "\").
print(df)

Unnamed: 0 Duration Pulse Maxpulse \


0 0 60 110 130 409.1 60.0 100.0 145.0
1 1 60 117 145 479.0 40.0 102.0 142.0
2 2 60 103 135 340.0 60.0 103.0 134.0
3 3 45 109 175 282.4 65.0 104.0 145.0
4 4 45 117 148 406.0 60.0 105.0 132.0
.. ... ... ... ...
164 164 60 105 140 290.8 NaN NaN NaN
165 165 60 110 145 300.4 NaN NaN NaN
166 166 60 115 145 310.2 NaN NaN NaN
167 167 75 120 150 320.4 NaN NaN NaN
168 168 75 125 150 330.4 NaN NaN NaN

Calories
0 409.0
1 445.0
2 451.0
3 431.0
4 421.0
.. ...
164 NaN
165 NaN
166 NaN
167 NaN
168 NaN

[169 rows x 5 columns]

In [9]:

# to_string() renders the frame in full: all columns on one line and no
# elided rows, unlike the default view in the previous cell.
print(df.to_string())

Unnamed: 0 Duration Pulse Maxpulse Calories


0 0 60 110 130 409.1 60.0 100.0 145.0 409.0
1 1 60 117 145 479.0 40.0 102.0 142.0 445.0
2 2 60 103 135 340.0 60.0 103.0 134.0 451.0
3 3 45 109 175 282.4 65.0 104.0 145.0 431.0
4 4 45 117 148 406.0 60.0 105.0 132.0 421.0
5 5 60 102 127 300.5 70.0 106.0 133.0 442.0
6 6 60 110 136 374.0 60.0 107.0 134.0 421.0
7 7 45 104 134 253.3 75.0 108.0 132.0 444.0
8 8 30 109 133 195.1 60.0 109.0 131.0 433.0
9 9 60 98 124 269.0 80.0 100.0 1125.0 422.0
10 10 60 103 147 329.3 60.0 110.0 124.0 411.0
11 11 60 100 120 250.7 85.0 111.0 123.0 455.0
12 12 60 106 128 345.3 60.0 112.0 121.0 544.0
13 13 60 104 132 379.3 90.0 114.0 131.0 644.0
14 14 60 98 123 275.0 60.0 115.0 142.0 NaN
15 15 60 98 120 215.2 95.0 116.0 142.0 534.0
16 16 60 100 120 300.0 60.0 117.0 153.0 645.0
17 17 45 90 112 NaN 40.0 118.0 163.0 5343.0
18 18 60 103 123 323.0 60.0 119.0 156.0 343.0
In [11]:

# Write the frame to a new workbook. No index argument is passed, so pandas'
# default applies and the row index is written as an extra first column.
df.to_excel("C:\\Users\\Nisha\\OneDrive\\Desktop\\Newdata1.xlsx")

In [13]:

# Same export to the same file, this time with index=False so the row labels
# are left out of the workbook.
df.to_excel("C:\\Users\\Nisha\\OneDrive\\Desktop\\Newdata1.xlsx",index= False)

In [14]:

# Export as CSV (comma-separated by default), again without the row index.
df.to_csv("C:\\Users\\Nisha\\OneDrive\\Desktop\\Newdata1.csv",index= False)

In [15]:

# Same to_csv call, but targeting a .txt file name. No sep is given, so the
# fields are still comma-separated despite the extension.
df.to_csv("C:\\Users\\Nisha\\OneDrive\\Desktop\\Newdata1.txt",index= False)

localhost:8892/notebooks/Untitled7.ipynb?kernel_name=python3 1/15
2/4/23, 1:43 PM Untitled7 - Jupyter Notebook

In [17]:

# Rewrite Newdata1.txt as tab-separated text by passing sep="\t".
df.to_csv("C:\\Users\\Nisha\\OneDrive\\Desktop\\Newdata1.txt",index= False, sep = "\t")

In [18]:

# Reload data1.xlsx and rebuild df from it.
# The output below differs from the first load (128 rows x 4 columns and no
# "Unnamed: 0" column), so the workbook was presumably edited between the two
# runs; confirm which version of the file later cells expect.
d = pd.read_excel("C:\\Users\\Nisha\\OneDrive\\Desktop\\data1.xlsx")
df = pd.DataFrame(d)
print(df)

Duration Pulse Maxpulse Calories


0 60 100 145 409.0
1 40 102 142 445.0
2 60 103 134 451.0
3 65 104 145 431.0
4 60 105 132 421.0
.. ... ... ... ...
123 60 160 135 452.0
124 60 161 135 451.0
125 60 162 134 543.0
126 60 163 132 543.0
127 60 164 131 421.0

[128 rows x 4 columns]

In [21]:

# Label-based lookup: the row whose index label is 3, returned as a Series
# (see "Name: 3" in the output).
df.loc[3]

Out[21]:

Duration 65.0
Pulse 104.0
Maxpulse 145.0
Calories 431.0
Name: 3, dtype: float64

In [24]:

# Row label 3 and column "Duration" together select a single scalar value.
df.loc[3,'Duration']

Out[24]:

65

In [25]:

# Label slice: .loc includes both endpoints, so labels 0 through 4 come back
# (five rows in the output).
df.loc[0:4]

Out[25]:

Duration Pulse Maxpulse Calories

0 60 100 145 409.0

1 40 102 142 445.0

2 60 103 134 451.0

3 65 104 145 431.0

4 60 105 132 421.0

In [27]:

# Rows labelled 0-4, restricted to the two columns named in the list.
df.loc[0:4,["Duration","Calories"]]

Out[27]:

Duration Calories

0 60 409.0

1 40 445.0

2 60 451.0

3 65 431.0

4 60 421.0

localhost:8892/notebooks/Untitled7.ipynb?kernel_name=python3 2/15
2/4/23, 1:43 PM Untitled7 - Jupyter Notebook

In [30]:

# Column labels can be sliced too, also inclusive on both ends: every column
# from "Duration" through "Calories".
df.loc[0:4,"Duration":"Calories"]

Out[30]:

Duration Pulse Maxpulse Calories

0 60 100 145 409.0

1 40 102 142 445.0

2 60 103 134 451.0

3 65 104 145 431.0

4 60 105 132 421.0

In [32]:

# Position-based slice: the end position is excluded, so rows 0-3 come back.
# The column slice 0:5 runs past the frame's four columns; the output shows the
# four existing columns, i.e. the out-of-range bound is clipped, not an error.
df.iloc[0:4,0:5]

Out[32]:

Duration Pulse Maxpulse Calories

0 60 100 145 409.0

1 40 102 142 445.0

2 60 103 134 451.0

3 65 104 145 431.0

In [120]:

# First four rows by position (0-3), all columns.
df.iloc[0:4]

Out[120]:

Duration Pulse Maxpulse Calories

0 60 100.0 145.0 409.0

1 60 100.0 145.0 409.0

2 60 103.0 134.0 451.0

3 65 104.0 145.0 431.0

In [38]:

# A list of positions selects exactly those rows: positions 0 and 9.
df.iloc[[0,9]]

Out[38]:

Duration Pulse Maxpulse Calories

0 60 100 145 409.0

9 80 100 1125 422.0

In [122]:

# First eleven rows (positions 0-10) and first three columns, by position.
df.iloc[:11,0:3]

Out[122]:

Duration Pulse Maxpulse

0 60 100.0 145.0

1 60 100.0 145.0

2 60 103.0 134.0

3 65 104.0 145.0

4 60 105.0 132.0

5 70 106.0 133.0

6 60 107.0 134.0

7 75 108.0 132.0

8 60 109.0 131.0

9 80 100.0 1125.0

10 60 110.0 124.0

localhost:8892/notebooks/Untitled7.ipynb?kernel_name=python3 3/15
2/4/23, 1:43 PM Untitled7 - Jupyter Notebook

In [43]:

# Show the frame before cleaning: 128 rows at this point.
print(df)

Duration Pulse Maxpulse Calories


0 60 100 145 409.0
1 40 102 142 445.0
2 60 103 134 451.0
3 65 104 145 431.0
4 60 105 132 421.0
.. ... ... ... ...
123 60 160 135 452.0
124 60 161 135 451.0
125 60 162 134 543.0
126 60 163 132 543.0
127 60 164 131 421.0

[128 rows x 4 columns]

In [44]:

# Display a copy of df with every NaN-containing row removed (124 rows in the
# output). The result is not assigned, so df itself is left unchanged.
df.dropna()

Out[44]:

Duration Pulse Maxpulse Calories

0 60 100 145 409.0

1 40 102 142 445.0

2 60 103 134 451.0

3 65 104 145 431.0

4 60 105 132 421.0

... ... ... ... ...

123 60 160 135 452.0

124 60 161 135 451.0

125 60 162 134 543.0

126 60 163 132 543.0

127 60 164 131 421.0

124 rows × 4 columns

In [45]:

# Remove the NaN-containing rows from df itself; with inplace=True nothing is
# returned, which is why this cell has no output.
df.dropna(inplace = True)

In [47]:

# Print the frame with any remaining NaN cells replaced by the text "missing".
# fillna() returns a new DataFrame and leaves df untouched, so the filled copy
# has to be used directly: calling fillna() as a bare statement and then
# printing df would throw the filled copy away and print the unfilled frame.
# df is deliberately not rebound, so its numeric columns keep their dtypes for
# the cells that follow.
print(df.fillna("missing").to_string())

Duration Pulse Maxpulse Calories


0 60 100 145 409.0
1 40 102 142 445.0
2 60 103 134 451.0
3 65 104 145 431.0
4 60 105 132 421.0
5 70 106 133 442.0
6 60 107 134 421.0
7 75 108 132 444.0
8 60 109 131 433.0
9 80 100 1125 422.0
10 60 110 124 411.0
11 85 111 123 455.0
12 60 112 121 544.0
13 90 114 131 644.0
15 95 116 142 534.0
16 60 117 153 645.0
17 40 118 163 5343.0
18 60 119 156 343.0
19 45 120 153 345.0

localhost:8892/notebooks/Untitled7.ipynb?kernel_name=python3 4/15
2/4/23, 1:43 PM Untitled7 - Jupyter Notebook

In [48]:

# Drop NaN rows in place, then print every remaining row.
# Label 14 is absent from the listing (13 is followed by 15): dropped rows leave
# a gap because the surviving rows keep their original index labels.
df.dropna(inplace = True)
print(df.to_string())

Duration Pulse Maxpulse Calories


0 60 100 145 409.0
1 40 102 142 445.0
2 60 103 134 451.0
3 65 104 145 431.0
4 60 105 132 421.0
5 70 106 133 442.0
6 60 107 134 421.0
7 75 108 132 444.0
8 60 109 131 433.0
9 80 100 1125 422.0
10 60 110 124 411.0
11 85 111 123 455.0
12 60 112 121 544.0
13 90 114 131 644.0
15 95 116 142 534.0
16 60 117 153 645.0
17 40 118 163 5343.0
18 60 119 156 343.0
19 45 120 153 345.0
In [49]:

# Summary view after cleaning: 124 rows remain, and the last label is still
# 127 because the index was not reset after the drop.
print(df)

Duration Pulse Maxpulse Calories


0 60 100 145 409.0
1 40 102 142 445.0
2 60 103 134 451.0
3 65 104 145 431.0
4 60 105 132 421.0
.. ... ... ... ...
123 60 160 135 452.0
124 60 161 135 451.0
125 60 162 134 543.0
126 60 163 132 543.0
127 60 164 131 421.0

[124 rows x 4 columns]

In [50]:

# Full, unabbreviated listing of the cleaned frame.
print(df.to_string())

Duration Pulse Maxpulse Calories


0 60 100 145 409.0
1 40 102 142 445.0
2 60 103 134 451.0
3 65 104 145 431.0
4 60 105 132 421.0
5 70 106 133 442.0
6 60 107 134 421.0
7 75 108 132 444.0
8 60 109 131 433.0
9 80 100 1125 422.0
10 60 110 124 411.0
11 85 111 123 455.0
12 60 112 121 544.0
13 90 114 131 644.0
15 95 116 142 534.0
16 60 117 153 645.0
17 40 118 163 5343.0
18 60 119 156 343.0
19 45 120 153 345.0
In [53]:

# Serialize the cleaned frame to a JSON file.
# NOTE(review): no orient is passed, so pandas' default layout is used,
# presumably column -> {row label -> value}; confirm if a consumer depends on it.
df.to_json("C:\\Users\\Nisha\\OneDrive\\Desktop\\Newdata1.json")
# The frame itself is unchanged by the export (still 124 rows in the output).
print(df)

Duration Pulse Maxpulse Calories


0 60 100 145 409.0
1 40 102 142 445.0
2 60 103 134 451.0
3 65 104 145 431.0
4 60 105 132 421.0
.. ... ... ... ...
123 60 160 135 452.0
124 60 161 135 451.0
125 60 162 134 543.0
126 60 163 132 543.0
127 60 164 131 421.0

[124 rows x 4 columns]

localhost:8892/notebooks/Untitled7.ipynb?kernel_name=python3 5/15
2/4/23, 1:43 PM Untitled7 - Jupyter Notebook

In [54]:

# Full listing again; the rows match the listing printed before the JSON export.
print(df.to_string())

Duration Pulse Maxpulse Calories


0 60 100 145 409.0
1 40 102 142 445.0
2 60 103 134 451.0
3 65 104 145 431.0
4 60 105 132 421.0
5 70 106 133 442.0
6 60 107 134 421.0
7 75 108 132 444.0
8 60 109 131 433.0
9 80 100 1125 422.0
10 60 110 124 411.0
11 85 111 123 455.0
12 60 112 121 544.0
13 90 114 131 644.0
15 95 116 142 534.0
16 60 117 153 645.0
17 40 118 163 5343.0
18 60 119 156 343.0
19 45 120 153 345.0
In [55]:

# JSON-shaped data that already lives in a Python dict (column name ->
# {row label -> value}) can be handed straight to the DataFrame constructor;
# no file round trip is needed.
data = {
    "Duration": {"0": 60, "1": 60, "2": 60, "3": 45, "4": 45, "5": 60},
    "Pulse": {"0": 110, "1": 117, "2": 103, "3": 109, "4": 117, "5": 102},
    "Maxpulse": {"0": 130, "1": 145, "2": 135, "3": 175, "4": 148, "5": 127},
    "Calories": {"0": 409, "1": 479, "2": 340, "3": 282, "4": 406, "5": 300},
}

# Outer keys become the columns; the inner string keys become the row labels.
df = pd.DataFrame(data)

print(df)

Duration Pulse Maxpulse Calories


0 60 110 130 409
1 60 117 145 479
2 60 103 135 340
3 45 109 175 282
4 45 117 148 406
5 60 102 127 300

localhost:8892/notebooks/Untitled7.ipynb?kernel_name=python3 6/15
2/4/23, 1:43 PM Untitled7 - Jupyter Notebook

In [56]:

# A DataFrame has an info() method that summarizes the data set: index range,
# column names, non-null counts, dtypes and memory usage.
# info() writes that report itself and returns None, so wrapping it in print()
# also prints the return value: that is the stray "None" on the last line of
# the output. NOTE(review): calling df.info() on its own avoids it.
print(df.info())

<class 'pandas.core.frame.DataFrame'>
Index: 6 entries, 0 to 5
Data columns (total 4 columns):
# Column Non-Null Count Dtype
--- ------ -------------- -----
0 Duration 6 non-null int64
1 Pulse 6 non-null int64
2 Maxpulse 6 non-null int64
3 Calories 6 non-null int64
dtypes: int64(4)
memory usage: 240.0+ bytes
None

In [57]:

# Data cleaning means fixing bad data in your data set.

# Bad data can be any of the following:

#   - empty cells
#   - data in the wrong format
#   - wrong data
#   - duplicates
# Empty cells can give you a wrong result when you analyze the data.

# Overwrite Newdata1.csv with the current df (the six-row frame built from the
# dict above), without the row index.
df.to_csv("C:\\Users\\Nisha\\OneDrive\\Desktop\\Newdata1.csv",index= False)
# dropna() returns a new frame without NaN rows; df is left as it was.
new_df = df.dropna()

# All six rows are still present in the output: this frame had no empty cells.
print(new_df.to_string())

Duration Pulse Maxpulse Calories


0 60 110 130 409
1 60 117 145 479
2 60 103 135 340
3 45 109 175 282
4 45 117 148 406
5 60 102 127 300

In [65]:

# Reload the CSV written earlier and clean the freshly loaded data.
# The file contents are bound to df (via d, as in the notebook's other load
# cells) so that the dropna() calls below operate on what was just read rather
# than on whatever df an earlier cell happened to leave behind.
d = pd.read_csv("C:\\Users\\Nisha\\OneDrive\\Desktop\\Newdata1.csv")
df = pd.DataFrame(d)

# dropna() returns a cleaned copy; df is unchanged at this point.
new_df = df.dropna()

print(new_df.to_string())

# inplace=True removes the NaN rows from df itself.
df.dropna(inplace = True)

print(df.to_string())

Duration Pulse Maxpulse Calories


0 60 110 130 409
1 60 117 145 479
2 60 103 135 340
3 45 109 175 282
4 45 117 148 406
5 60 102 127 300
Duration Pulse Maxpulse Calories
0 60 110 130 409
1 60 117 145 479
2 60 103 135 340
3 45 109 175 282
4 45 117 148 406
5 60 102 127 300

In [60]:

# Show the six-row frame; it is short enough that no rows are elided.
print(df)

Duration Pulse Maxpulse Calories


0 60 110 130 409
1 60 117 145 479
2 60 103 135 340
3 45 109 175 282
4 45 117 148 406
5 60 102 127 300

localhost:8892/notebooks/Untitled7.ipynb?kernel_name=python3 7/15
2/4/23, 1:43 PM Untitled7 - Jupyter Notebook

In [61]:

# Read Newdata1.csv back in and rebuild df from it; the output shows the same
# six rows that were written to the file.
d = pd.read_csv("C:\\Users\\Nisha\\OneDrive\\Desktop\\Newdata1.csv")
df = pd.DataFrame(d)
print(df)

Duration Pulse Maxpulse Calories


0 60 110 130 409
1 60 117 145 479
2 60 103 135 340
3 45 109 175 282
4 45 117 148 406
5 60 102 127 300

In [62]:

# Write the frame back to the same CSV file (no index column), then show it.
df.to_csv("C:\\Users\\Nisha\\OneDrive\\Desktop\\Newdata1.csv",index= False)
print(df)

Duration Pulse Maxpulse Calories


0 60 110 130 409
1 60 117 145 479
2 60 103 135 340
3 45 109 175 282
4 45 117 148 406
5 60 102 127 300

In [64]:

# Export the same frame as tab-separated text (sep="\t"), without the index.
df.to_csv("C:\\Users\\Nisha\\OneDrive\\Desktop\\Newdata1.txt",index= False,sep = "\t")


print(df)

Duration Pulse Maxpulse Calories


0 60 110 130 409
1 60 117 145 479
2 60 103 135 340
3 45 109 175 282
4 45 117 148 406
5 60 102 127 300

In [66]:

# One boolean per row, True where the row repeats an earlier one.
# Every value is False in the output, so this six-row frame has no duplicates.
df.duplicated()

Out[66]:

0 False
1 False
2 False
3 False
4 False
5 False
dtype: bool

In [67]:

# Switch back to the larger data set: reload data1.xlsx (128 rows x 4 columns
# in the output) and rebuild df from it.
d = pd.read_excel("C:\\Users\\Nisha\\OneDrive\\Desktop\\data1.xlsx")
df = pd.DataFrame(d)
print(df)

Duration Pulse Maxpulse Calories


0 60 100 145 409.0
1 40 102 142 445.0
2 60 103 134 451.0
3 65 104 145 431.0
4 60 105 132 421.0
.. ... ... ... ...
123 60 160 135 452.0
124 60 161 135 451.0
125 60 162 134 543.0
126 60 163 132 543.0
127 60 164 131 421.0

[128 rows x 4 columns]

In [77]:

# Save the reloaded frame as Newdata2.csv, without the row index.
df.to_csv("C:\\Users\\Nisha\\OneDrive\\Desktop\\Newdata2.csv",index= False)

localhost:8892/notebooks/Untitled7.ipynb?kernel_name=python3 8/15
2/4/23, 1:43 PM Untitled7 - Jupyter Notebook

In [72]:

# Summary view of the reloaded frame (128 rows).
print(df)

Duration Pulse Maxpulse Calories


0 60 100 145 409.0
1 40 102 142 445.0
2 60 103 134 451.0
3 65 104 145 431.0
4 60 105 132 421.0
.. ... ... ... ...
123 60 160 135 452.0
124 60 161 135 451.0
125 60 162 134 543.0
126 60 163 132 543.0
127 60 164 131 421.0

[128 rows x 4 columns]

In [73]:

# Duplicate check on the 128-row frame; the long result is abbreviated in the
# output, and every row that is shown is False.
df.duplicated()

Out[73]:

0 False
1 False
2 False
3 False
4 False
...
123 False
124 False
125 False
126 False
127 False
Length: 128, dtype: bool

In [78]:

# Full listing; row 14 shows NaN in Calories, i.e. the data still has gaps.
print(df.to_string())

Duration Pulse Maxpulse Calories


0 60 100 145 409.0
1 40 102 142 445.0
2 60 103 134 451.0
3 65 104 145 431.0
4 60 105 132 421.0
5 70 106 133 442.0
6 60 107 134 421.0
7 75 108 132 444.0
8 60 109 131 433.0
9 80 100 1125 422.0
10 60 110 124 411.0
11 85 111 123 455.0
12 60 112 121 544.0
13 90 114 131 644.0
14 60 115 142 NaN
15 95 116 142 534.0
16 60 117 153 645.0
17 40 118 163 5343.0
18 60 119 156 343.0
In [76]:

# dropna() returns a new frame; the result is discarded here, so df is not
# changed. The listing below confirms it: row 14 still shows NaN in Calories.
# Assign the result or pass inplace=True to actually remove the rows.
df.dropna()
print(df.to_string())

Duration Pulse Maxpulse Calories


0 60 100 145 409.0
1 40 102 142 445.0
2 60 103 134 451.0
3 65 104 145 431.0
4 60 105 132 421.0
5 70 106 133 442.0
6 60 107 134 421.0
7 75 108 132 444.0
8 60 109 131 433.0
9 80 100 1125 422.0
10 60 110 124 411.0
11 85 111 123 455.0
12 60 112 121 544.0
13 90 114 131 644.0
14 60 115 142 NaN
15 95 116 142 534.0
16 60 117 153 645.0
17 40 118 163 5343.0
18 60 119 156 343.0

localhost:8892/notebooks/Untitled7.ipynb?kernel_name=python3 9/15
2/4/23, 1:43 PM Untitled7 - Jupyter Notebook

In [90]:

# Reload data1.xlsx once more. The contents differ from the earlier loads:
# Pulse and Maxpulse now print as floats and row 1 repeats row 0, so the
# workbook was presumably edited again to add missing values and duplicates.
d = pd.read_excel("C:\\Users\\Nisha\\OneDrive\\Desktop\\data1.xlsx")
df = pd.DataFrame(d)
print(df)

Duration Pulse Maxpulse Calories


0 60 100.0 145.0 409.0
1 60 100.0 145.0 409.0
2 60 103.0 134.0 451.0
3 65 104.0 145.0 431.0
4 60 105.0 132.0 421.0
.. ... ... ... ...
123 60 160.0 135.0 452.0
124 60 161.0 135.0 451.0
125 60 162.0 134.0 543.0
126 60 163.0 132.0 543.0
127 60 164.0 131.0 421.0

[128 rows x 4 columns]

In [82]:

# As before, the dropna() result is thrown away, so df keeps its NaN rows
# (row 15 still shows NaN in Calories in the listing below).
df.dropna()
print(df.to_string())

Duration Pulse Maxpulse Calories


0 60 100.0 145.0 409.0
1 60 100.0 145.0 409.0
2 60 103.0 134.0 451.0
3 65 104.0 145.0 431.0
4 60 105.0 132.0 421.0
5 70 106.0 133.0 442.0
6 60 107.0 134.0 421.0
7 75 108.0 132.0 444.0
8 60 109.0 131.0 433.0
9 80 100.0 1125.0 422.0
10 60 110.0 124.0 411.0
11 85 111.0 123.0 455.0
12 60 112.0 121.0 544.0
13 90 114.0 131.0 644.0
14 90 114.0 131.0 644.0
15 95 116.0 142.0 NaN
16 60 117.0 153.0 645.0
17 40 118.0 163.0 5343.0
18 60 NaN 156.0 343.0
In [118]:

# Remove the NaN-containing rows from df itself.
df.dropna(inplace = True)

In [119]:

# Display a copy of df with NaN cells replaced by "missing"; df is not changed.
# NOTE(review): the cell above already dropped the NaN rows in place (122 rows
# remain in the output), so there is presumably nothing left to fill here.
df.fillna("missing")

Out[119]:

Duration Pulse Maxpulse Calories

0 60 100.0 145.0 409.0

1 60 100.0 145.0 409.0

2 60 103.0 134.0 451.0

3 65 104.0 145.0 431.0

4 60 105.0 132.0 421.0

... ... ... ... ...

123 60 160.0 135.0 452.0

124 60 161.0 135.0 451.0

125 60 162.0 134.0 543.0

126 60 163.0 132.0 543.0

127 60 164.0 131.0 421.0

122 rows × 4 columns

In [115]:

# Reload the workbook and drop NaN rows in place in one cell, so df starts the
# next steps without missing values.
d = pd.read_excel("C:\\Users\\Nisha\\OneDrive\\Desktop\\data1.xlsx")
df = pd.DataFrame(d)
df.dropna(inplace = True)

localhost:8892/notebooks/Untitled7.ipynb?kernel_name=python3 10/15
2/4/23, 1:43 PM Untitled7 - Jupyter Notebook

In [116]:

# Save the current df to Newdata2.csv, without the row index.
df.to_csv("C:\\Users\\Nisha\\OneDrive\\Desktop\\Newdata2.csv",index= False)
# Replace any NaN cells in df with the constant 130, in place.
# NOTE(review): the cell printed just above this one drops NaN rows in place,
# so this fill presumably has nothing to fill; confirm the intended execution
# order. The constant 130 is not explained anywhere in the notebook.
df.fillna(130, inplace = True)
# Leftover display calls, disabled by the author:
#print(df)
# print(df.to_string())

In [98]:

# Flag repeated rows: row 1 is True in the output because it repeats row 0.
df.duplicated()

Out[98]:

0 False
1 True
2 False
3 False
4 False
...
123 False
124 False
125 False
126 False
127 False
Length: 122, dtype: bool

In [99]:

# Display a copy without the repeated rows (120 rows in the output, label 1 is
# gone). The result is not assigned, so df itself is unchanged.
df.drop_duplicates()

Out[99]:

Duration Pulse Maxpulse Calories

0 60 100.0 145.0 409.0

2 60 103.0 134.0 451.0

3 65 104.0 145.0 431.0

4 60 105.0 132.0 421.0

5 70 106.0 133.0 442.0

... ... ... ... ...

123 60 160.0 135.0 452.0

124 60 161.0 135.0 451.0

125 60 162.0 134.0 543.0

126 60 163.0 132.0 543.0

127 60 164.0 131.0 421.0

120 rows × 4 columns

In [100]:

# Remove the repeated rows from df itself.
df.drop_duplicates(inplace = True)

In [101]:

# Confirm the in-place removal: 120 rows remain and label 1 no longer appears.
print(df)

Duration Pulse Maxpulse Calories


0 60 100.0 145.0 409.0
2 60 103.0 134.0 451.0
3 65 104.0 145.0 431.0
4 60 105.0 132.0 421.0
5 70 106.0 133.0 442.0
.. ... ... ... ...
123 60 160.0 135.0 452.0
124 60 161.0 135.0 451.0
125 60 162.0 134.0 543.0
126 60 163.0 132.0 543.0
127 60 164.0 131.0 421.0

[120 rows x 4 columns]

localhost:8892/notebooks/Untitled7.ipynb?kernel_name=python3 11/15
2/4/23, 1:43 PM Untitled7 - Jupyter Notebook

In [108]:

# Reload the workbook for the filtering examples; this discards the cleaned
# frame, so df is back to 128 rows with the duplicate row 1 present.
d = pd.read_excel("C:\\Users\\Nisha\\OneDrive\\Desktop\\data1.xlsx")
df = pd.DataFrame(d)
print(df)

Duration Pulse Maxpulse Calories


0 60 100.0 145.0 409.0
1 60 100.0 145.0 409.0
2 60 103.0 134.0 451.0
3 65 104.0 145.0 431.0
4 60 105.0 132.0 421.0
.. ... ... ... ...
123 60 160.0 135.0 452.0
124 60 161.0 135.0 451.0
125 60 162.0 134.0 543.0
126 60 163.0 132.0 543.0
127 60 164.0 131.0 421.0

[128 rows x 4 columns]

In [111]:

# Filter rows with .loc and a boolean mask: the comparison yields one
# True/False per row, and only the rows where Maxpulse is below 135 are kept.

df.loc[df["Maxpulse"]<135]

Out[111]:

Duration Pulse Maxpulse Calories

2 60 103.0 134.0 451.0

4 60 105.0 132.0 421.0

5 70 106.0 133.0 442.0

6 60 107.0 134.0 421.0

7 75 108.0 132.0 444.0

8 60 109.0 131.0 433.0

10 60 110.0 124.0 411.0

11 85 111.0 123.0 455.0

12 60 112.0 121.0 544.0

13 90 114.0 131.0 644.0

14 90 114.0 131.0 644.0

24 60 125.0 134.0 445.0

54 60 155.0 124.0 433.0

56 60 157.0 134.0 411.0

57 75 158.0 132.0 455.0

61 85 162.0 134.0 534.0

62 60 163.0 132.0 645.0

63 90 164.0 131.0 5343.0

66 60 103.0 134.0 345.0

68 60 105.0 132.0 3435.0

69 75 106.0 133.0 409.0

70 60 107.0 134.0 445.0

71 85 108.0 132.0 451.0

72 60 109.0 131.0 431.0

74 60 110.0 124.0 442.0

75 35 111.0 123.0 421.0

76 60 112.0 121.0 444.0

77 45 114.0 131.0 433.0

88 60 125.0 134.0 345.0

118 60 155.0 124.0 432.0

120 60 157.0 134.0 442.0

121 60 158.0 132.0 441.0

125 60 162.0 134.0 543.0

126 60 163.0 132.0 543.0

127 60 164.0 131.0 421.0

localhost:8892/notebooks/Untitled7.ipynb?kernel_name=python3 12/15
2/4/23, 1:43 PM Untitled7 - Jupyter Notebook

In [126]:

# Filter on a combined condition: keep rows where Maxpulse is below 135 OR
# Pulse is below 125. "|" is the element-wise OR; each comparison needs its own
# parentheses because "|" binds more tightly than "<".

df.loc[(df["Maxpulse"]<135)|(df["Pulse"]<125)]

localhost:8892/notebooks/Untitled7.ipynb?kernel_name=python3 13/15
2/4/23, 1:43 PM Untitled7 - Jupyter Notebook

Out[126]:

Duration Pulse Maxpulse Calories

0 60 100.0 145.0 409.0

1 60 100.0 145.0 409.0

2 60 103.0 134.0 451.0

3 65 104.0 145.0 431.0

4 60 105.0 132.0 421.0

5 70 106.0 133.0 442.0

6 60 107.0 134.0 421.0

7 75 108.0 132.0 444.0

8 60 109.0 131.0 433.0

9 80 100.0 1125.0 422.0

10 60 110.0 124.0 411.0

11 85 111.0 123.0 455.0

12 60 112.0 121.0 544.0

13 90 114.0 131.0 644.0

14 90 114.0 131.0 644.0

16 60 117.0 153.0 645.0

17 40 118.0 163.0 5343.0

19 45 120.0 153.0 345.0

20 60 121.0 152.0 345.0

21 50 122.0 153.0 355.0

23 55 124.0 146.0 409.0

24 60 125.0 134.0 445.0

54 60 155.0 124.0 433.0

56 60 157.0 134.0 411.0

57 75 158.0 132.0 455.0

61 85 162.0 134.0 534.0

62 60 163.0 132.0 645.0

63 90 164.0 131.0 5343.0

64 60 100.0 145.0 343.0

65 95 102.0 142.0 345.0

66 60 103.0 134.0 345.0

67 65 104.0 145.0 355.0

68 60 105.0 132.0 3435.0

69 75 106.0 133.0 409.0

70 60 107.0 134.0 445.0

71 85 108.0 132.0 451.0

72 60 109.0 131.0 431.0

73 95 100.0 1125.0 421.0

74 60 110.0 124.0 442.0

75 35 111.0 123.0 421.0

76 60 112.0 121.0 444.0

77 45 114.0 131.0 433.0

78 60 115.0 142.0 422.0

79 55 116.0 142.0 411.0

80 60 117.0 153.0 455.0

81 65 118.0 163.0 544.0

82 60 119.0 156.0 644.0

84 60 121.0 152.0 534.0

85 35 122.0 153.0 645.0

86 60 123.0 154.0 5343.0

87 40 124.0 146.0 343.0

88 60 125.0 134.0 345.0

118 60 155.0 124.0 432.0

120 60 157.0 134.0 442.0

121 60 158.0 132.0 441.0

125 60 162.0 134.0 543.0

126 60 163.0 132.0 543.0

localhost:8892/notebooks/Untitled7.ipynb?kernel_name=python3 14/15
2/4/23, 1:43 PM Untitled7 - Jupyter Notebook
Duration Pulse Maxpulse Calories

127 60 164.0 131.0 421.0

In [124]:

# Element-wise AND ("&"): keep only rows where Maxpulse is above 135 and Pulse
# is above 145 at the same time.
df.loc[(df["Maxpulse"]>135)&(df["Pulse"]>145)]

Out[124]:

Duration Pulse Maxpulse Calories

45 35 146.0 162.0 3435.0

46 60 147.0 161.0 409.0

47 40 148.0 170.0 445.0

48 60 149.0 171.0 451.0

49 50 150.0 172.0 431.0

50 60 151.0 173.0 421.0

51 55 152.0 172.0 442.0

52 60 153.0 171.0 421.0

53 65 154.0 156.0 444.0

58 60 159.0 154.0 544.0

109 60 146.0 162.0 5343.0

110 60 147.0 161.0 343.0

111 60 148.0 170.0 345.0

112 60 149.0 171.0 345.0

113 60 150.0 172.0 355.0

114 60 151.0 173.0 3435.0

115 60 152.0 172.0 544.0

116 60 153.0 171.0 322.0

117 60 154.0 156.0 432.0

122 60 159.0 154.0 453.0

In [ ]:

# NOTE(review): this cell has no execution count or output and repeats the
# Maxpulse < 135 filter shown earlier; it looks like a leftover draft.
df.loc[df["Maxpulse"]<135]

localhost:8892/notebooks/Untitled7.ipynb?kernel_name=python3 15/15

You might also like