Académique Documents
Professionnel Documents
Culture Documents
Dsbda 1
Dsbda 1
In [3]: weather.head(15)
Out[3]: Date Location MinTemp MaxTemp Rainfall Evaporation Sunshine WindGustDir WindGus
0 2008-12-01 Albury 13.4 22.9 0.6 NaN NaN W
1 2008-12-02 Albury 7.4 25.1 0.0 NaN NaN WNW
2 2008-12-03 Albury 12.9 25.7 0.0 NaN NaN WSW
3 2008-12-04 Albury 9.2 28.0 0.0 NaN NaN NE
4 2008-12-05 Albury 17.5 32.3 1.0 NaN NaN W
5 2008-12-06 Albury 14.6 29.7 0.2 NaN NaN WNW
6 2008-12-07 Albury 14.3 25.0 0.0 NaN NaN W
7 2008-12-08 Albury 7.7 26.7 0.0 NaN NaN W
8 2008-12-09 Albury 9.7 31.9 0.0 NaN NaN NNW
9 2008-12-10 Albury 13.1 30.1 1.4 NaN NaN W
10 2008-12-11 Albury 13.4 30.4 0.0 NaN NaN N
11 2008-12-12 Albury 15.9 21.7 2.2 NaN NaN NNE
12 2008-12-13 Albury 15.9 18.6 15.6 NaN NaN W
13 2008-12-14 Albury 12.6 21.0 3.6 NaN NaN SW
14 2008-12-16 Albury 9.8 27.7 NaN NaN NaN WNW
15 rows × 24 columns
In [4]: weather.tail()
Out[4]: Date Location MinTemp MaxTemp Rainfall Evaporation Sunshine WindGustDir Win
142188 2017-06-20 Uluru 3.5 21.8 0.0 NaN NaN E
142189 2017-06-21 Uluru 2.8 23.4 0.0 NaN NaN E
142190 2017-06-22 Uluru 3.6 25.3 0.0 NaN NaN NNW
142191 2017-06-23 Uluru 5.4 26.9 0.0 NaN NaN N
142192 2017-06-24 Uluru 7.8 27.0 0.0 NaN NaN SE
5 rows × 24 columns
In [5]: weather.columns
In [6]: print(len(weather.columns))
24
In [7]: weather.index
In [8]: weather.shape
Out[8]: (142193, 24)
In [9]: weather.dtypes
In [10]: weather.columns.values
In [11]: weather.describe(include='all')
top 2013-12-01 Canberra NaN NaN NaN NaN NaN
11 rows × 24 columns
In [12]: weather['Date']
Out[12]: 0 2008-12-01
1 2008-12-02
2 2008-12-03
3 2008-12-04
4 2008-12-05
...
142188 2017-06-20
142189 2017-06-21
142190 2017-06-22
142191 2017-06-23
142192 2017-06-24
Name: Date, Length: 142193, dtype: object
In [13]: weather.sort_index(axis=1,ascending=False)
In [14]: weather.sort_index(axis=1,ascending=True)
0 NaN 8.0 2008-12-01 NaN 22.0 71.0 Albury 2
1 NaN NaN 2008-12-02 NaN 25.0 44.0 Albury 2
2 2.0 NaN 2008-12-03 NaN 30.0 38.0 Albury 2
3 NaN NaN 2008-12-04 NaN 16.0 45.0 Albury 2
4 8.0 7.0 2008-12-05 NaN 33.0 82.0 Albury 3
142188 NaN NaN 2017-06-20 NaN 27.0 59.0 Uluru 2
142189 NaN NaN 2017-06-21 NaN 24.0 51.0 Uluru 2
142190 NaN NaN 2017-06-22 NaN 21.0 56.0 Uluru 2
142191 NaN NaN 2017-06-23 NaN 24.0 53.0 Uluru 2
142192 2.0 3.0 2017-06-24 NaN 24.0 51.0 Uluru 2
In [15]: weather.sort_values(by='Date')
44351 2007-11-01 Canberra 8.0 24.3 0.0 3.4 6.3 NW
44352 2007-11-02 Canberra 14.0 26.9 3.6 4.4 9.7 ENE
44353 2007-11-03 Canberra 13.7 23.4 3.6 5.8 3.3 NW
44354 2007-11-04 Canberra 13.3 15.5 39.8 7.2 9.1 NW
44355 2007-11-05 Canberra 7.6 16.1 2.8 5.6 10.6 SSE
38814 2017-06-25 WaggaWagga -0.1 12.7 0.0 NaN NaN SSW
32833 2017-06-25 Sydney 7.6 19.3 0.0 3.4 9.4 W
29496 2017-06-25 Richmond 2.7 20.0 0.2 NaN NaN W
26545 2017-06-25 Penrith 3.1 20.0 0.0 NaN NaN SW
35838 2017-06-25 SydneyAirport 6.8 19.5 0.0 3.4 9.4 WSW
In [16]: weather.iloc[5]
Out[16]: Date 2008-12-06
Location Albury
MinTemp 14.6
MaxTemp 29.7
Rainfall 0.2
Evaporation NaN
Sunshine NaN
WindGustDir WNW
WindGustSpeed 56.0
WindDir9am W
WindDir3pm W
WindSpeed9am 19.0
WindSpeed3pm 24.0
Humidity9am 55.0
Humidity3pm 23.0
Pressure9am 1009.2
Pressure3pm 1005.4
Cloud9am NaN
Cloud3pm NaN
Temp9am 20.6
Temp3pm 28.9
RainToday No
RISK_MM 0.0
RainTomorrow No
Name: 5, dtype: object
In [17]: weather[10:15]
Out[17]: Date Location MinTemp MaxTemp Rainfall Evaporation Sunshine WindGustDir WindGus
10 2008-12-11 Albury 13.4 30.4 0.0 NaN NaN N
11 2008-12-12 Albury 15.9 21.7 2.2 NaN NaN NNE
12 2008-12-13 Albury 15.9 18.6 15.6 NaN NaN W
13 2008-12-14 Albury 12.6 21.0 3.6 NaN NaN SW
14 2008-12-16 Albury 9.8 27.7 NaN NaN NaN WNW
5 rows × 24 columns
In [18]: weather.loc[:,["Date"]]
Out[18]: Date
0 2008-12-01
1 2008-12-02
2 2008-12-03
3 2008-12-04
4 2008-12-05
... ...
142188 2017-06-20
142189 2017-06-21
142190 2017-06-22
142191 2017-06-23
142192 2017-06-24
In [19]: weather.iloc[:10, :]
Out[19]: Date Location MinTemp MaxTemp Rainfall Evaporation Sunshine WindGustDir WindGust
0 2008-12-01 Albury 13.4 22.9 0.6 NaN NaN W
1 2008-12-02 Albury 7.4 25.1 0.0 NaN NaN WNW
2 2008-12-03 Albury 12.9 25.7 0.0 NaN NaN WSW
3 2008-12-04 Albury 9.2 28.0 0.0 NaN NaN NE
4 2008-12-05 Albury 17.5 32.3 1.0 NaN NaN W
5 2008-12-06 Albury 14.6 29.7 0.2 NaN NaN WNW
6 2008-12-07 Albury 14.3 25.0 0.0 NaN NaN W
7 2008-12-08 Albury 7.7 26.7 0.0 NaN NaN W
8 2008-12-09 Albury 9.7 31.9 0.0 NaN NaN NNW
9 2008-12-10 Albury 13.1 30.1 1.4 NaN NaN W
10 rows × 24 columns
Out[20]: Date Location MinTemp MaxTemp Rainfall Evaporation Sunshine WindGustDir Win
0 2008-12-01 Albury 13.4 22.9 0.6 NaN NaN W
1 2008-12-02 Albury 7.4 25.1 0.0 NaN NaN WNW
2 2008-12-03 Albury 12.9 25.7 0.0 NaN NaN WSW
3 2008-12-04 Albury 9.2 28.0 0.0 NaN NaN NE
4 2008-12-05 Albury 17.5 32.3 1.0 NaN NaN W
142188 2017-06-20 Uluru 3.5 21.8 0.0 NaN NaN E
142189 2017-06-21 Uluru 2.8 23.4 0.0 NaN NaN E
142190 2017-06-22 Uluru 3.6 25.3 0.0 NaN NaN NNW
142191 2017-06-23 Uluru 5.4 26.9 0.0 NaN NaN N
142192 2017-06-24 Uluru 7.8 27.0 0.0 NaN NaN SE
Out[21]: Date Location MinTemp MaxTemp Rainfall Evaporation Sunshine WindGustDir WindGust
0 2008-12-01 Albury 13.4 22.9 0.6 NaN NaN W
1 2008-12-02 Albury 7.4 25.1 0.0 NaN NaN WNW
2 2008-12-03 Albury 12.9 25.7 0.0 NaN NaN WSW
3 2008-12-04 Albury 9.2 28.0 0.0 NaN NaN NE
4 2008-12-05 Albury 17.5 32.3 1.0 NaN NaN W
5 2008-12-06 Albury 14.6 29.7 0.2 NaN NaN WNW
6 2008-12-07 Albury 14.3 25.0 0.0 NaN NaN W
7 2008-12-08 Albury 7.7 26.7 0.0 NaN NaN W
8 2008-12-09 Albury 9.7 31.9 0.0 NaN NaN NNW
9 2008-12-10 Albury 13.1 30.1 1.4 NaN NaN W
In [22]: weather.isnull()
Out[22]: Date Location MinTemp MaxTemp Rainfall Evaporation Sunshine WindGustDir Wind
In [23]: weather.isna()
Out[23]: Date Location MinTemp MaxTemp Rainfall Evaporation Sunshine WindGustDir Wind
In [24]: weather.isnull().any()
Out[24]: Date False
Location False
MinTemp True
MaxTemp True
Rainfall True
Evaporation True
Sunshine True
WindGustDir True
WindGustSpeed True
WindDir9am True
WindDir3pm True
WindSpeed9am True
WindSpeed3pm True
Humidity9am True
Humidity3pm True
Pressure9am True
Pressure3pm True
Cloud9am True
Cloud3pm True
Temp9am True
Temp3pm True
RainToday True
RISK_MM False
RainTomorrow False
dtype: bool
In [25]: weather.isnull().sum().sum()
Out[25]: 316559
In [26]: weather.isnull().sum(axis=1)
In [27]: weather.isna().sum()
Out[27]: Date 0
Location 0
MinTemp 637
MaxTemp 322
Rainfall 1406
Evaporation 60843
Sunshine 67816
WindGustDir 9330
WindGustSpeed 9270
WindDir9am 10013
WindDir3pm 3778
WindSpeed9am 1348
WindSpeed3pm 2630
Humidity9am 1774
Humidity3pm 3610
Pressure9am 14014
Pressure3pm 13981
Cloud9am 53657
Cloud3pm 57094
Temp9am 904
Temp3pm 2726
RainToday 1406
RISK_MM 0
RainTomorrow 0
dtype: int64
In [28]: weather.Evaporation.isnull().sum()
Out[28]: 60843
In [30]: weather.info()
In [31]: print(weather.std())
MinTemp 6.403283
MaxTemp 7.117618
Rainfall 8.465173
Evaporation 4.188537
Sunshine 3.781525
WindGustSpeed 13.588801
WindSpeed9am 8.893337
WindSpeed3pm 8.803345
Humidity9am 19.051293
Humidity3pm 20.797772
Pressure9am 7.105476
Pressure3pm 7.036677
Cloud9am 2.887016
Cloud3pm 2.720633
Temp9am 6.492838
Temp3pm 6.937594
RISK_MM 8.477969
dtype: float64
/tmp/ipykernel_5332/3866207191.py:1: FutureWarning: The default value of numeric_only in DataFrame.std is deprecated. In a future version, it will default to False. In addition, specifying 'numeric_only=None' is deprecated. Select only valid columns or specify the value of numeric_only to silence this warning.
print(weather.std())
In [32]: print(weather.median())
In [ ]: