[IT]/python.pandas
pandas.basic
givemebro
2020. 4. 6. 09:20
반응형
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
CARD_SUBWAY_MONTH_201905.txt
1.16MB
# Load the subway card usage file into a DataFrame.
data = pd.read_csv('CARD_SUBWAY_MONTH_201905.txt')

# First look at the table: leading rows, trailing rows, a column summary,
# and descriptive statistics.
data.head(20)
data.tail()
data.info()
data.describe()

# Row labels and column labels.
data.index
data.columns

# Attribute access and bracket access are the same expression: both select
# the single column '사용일자' (presumably "usage date" -- confirm).
data.사용일자
data['사용일자']

# Passing a list of column names selects several columns at once.
data2 = data[['승차총승객수', '하차총승객수']]
data2
# pandas -> numpy: the selected columns as a plain array.
data2.values

# Boolean-mask filtering: keep only the rows where the condition holds.
data.loc[data['승차총승객수'] < 10]
data.loc[data['사용일자'] == 20190501]

# Number of rows whose '사용일자' equals 20190501.
data.loc[data['사용일자'] == 20190501].shape[0]
# -> 593 (output recorded in the original notes)
data.loc[data['사용일자'] == 20190501].shape
# -> (593, 7) (output recorded in the original notes)

# Row count for every value 20190501..20190531, first as [day, count] pairs
# and then as a {day: count} mapping.
[[day, len(data.loc[data['사용일자'] == day])] for day in range(20190501, 20190532)]
{day: int((data['사용일자'] == day).sum()) for day in range(20190501, 20190532)}

# Missing-value check: element-wise mask, then the per-column count.
data.isna()
# data.notnull() would give the complementary mask.
data.isna().sum()
반응형