# Data preprocessing: add sample rows to data_1, then remove duplicate ids
# and rows whose name is missing.
import pandas as pd

# data_1 is not created anywhere in this section; it presumably comes from an
# earlier step (the first id added here is '002') -- TODO confirm. Fall back
# to an empty frame so this section can also run on its own.
try:
    data_1
except NameError:
    data_1 = pd.DataFrame(columns=['id', 'name'])

# Sample rows: id '003' appears twice and id '004' has a missing name, so the
# cleaning steps below have something to act on.
new_rows = pd.DataFrame([
    {'id': '002', 'name': 'chi'},
    {'id': '003', 'name': 'david'},
    {'id': '003', 'name': 'david'},
    {'id': '004', 'name': float('NaN')},
])
# DataFrame.append was removed in pandas 2.0; pd.concat is its replacement.
# ignore_index=True renumbers the rows 0..n-1, which is what the chained
# reset_index(drop=True) calls produced before.
data_1 = pd.concat([data_1, new_rows], ignore_index=True)
data_1

# Duplicates
# Inspect: True marks a row whose id already appeared in an earlier row.
data_1.duplicated('id')
# Remove: keep only the first row for each id (the index is not renumbered).
data_1 = data_1.drop_duplicates('id')
data_1

# Missing values (NaN / None)
# Inspect: True marks a row whose name is missing.
data_1['name'].isnull()
# Remove: keep only the rows whose name is present.
data_1 = data_1[data_1['name'].notnull()]
data_1
# 文章標籤 (blog page footer: "article tags")
# 全站熱搜 (blog page footer: "site-wide trending searches")
