# Note: these are only informal scratch notes.

 

import numpy as np
import pandas as pd
import seaborn as sns

 

# Location of the training CSV. The original note called pd.read_csv() with
# no argument, which raises TypeError. The file name below is a placeholder:
# TODO confirm and point it at the real data file.
TRAIN_CSV_PATH = "TrainingSet.csv"

# Read the CSV-format training data.
train_set = pd.read_csv(TRAIN_CSV_PATH)

# Feature table: drop the columns that are not used as features.
train = train_set.drop(['EbayID', 'QuantitySold', 'SellerName'], axis=1)

# Sale outcome of each row, kept separately as the target.
train_target = train_set['QuantitySold']

# DataFrame.shape returns a tuple representing the dimensionality of the
# DataFrame, i.e. (rows, columns); the second entry is the feature count.
n_samples, n_features = train.shape

 

# Build one frame holding the features plus the label for plotting.
# Feature columns are labelled 0..n_features-1 so they can be picked by
# number below; the last column is the label.
# isSold: 1 if the auction succeeded, 0 if it failed.
features_and_label = np.column_stack(
    # .to_numpy() first: indexing a Series with [:, None] is rejected by
    # current pandas, while column_stack appends a 1-D array as a column.
    (train.to_numpy(), train_target.to_numpy())
)
df = pd.DataFrame(
    features_and_label,
    # range() cannot be concatenated with a list on Python 3, so unpack it.
    columns=[*range(n_features), "isSold"],
)

# Pairwise plots of a few feature columns for the first 50 rows, coloured by
# the label. `height` is the current name of the keyword formerly spelled
# `size` in seaborn's pairplot.
_ = sns.pairplot(df[:50], vars=[2, 3, 4, 10, 13], hue="isSold", height=1.5)