DM-exp-1/4-2-3.py

11 lines
328 B
Python
Raw Normal View History

import pandas as pd
import numpy as np
# Path of the Excel file to preprocess (the original note calls it the sales data path).
inputfile = '5Preprocessing/1.xlsx'

# Read the Excel file with pandas and echo what was loaded.
s = pd.read_excel(inputfile)
print('数据输出为:\n', s)

# Remove duplicates: drop repeated values from column 'x'.
x_column = s['x']
data1 = x_column.drop_duplicates()
print('数据输出为:\n', data1)

# Fill missing values: replace the gaps in column 'y' with that column's median.
y_column = s['y']
y_median = y_column.median()
data2 = y_column.fillna(y_median)
print(data2)