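# Commonly used features for numeric (continuous-valued) data.
### Statistical features of continuous values, such as the mean and variance.
## Input: a DataFrame with the id and label columns removed.
## Output: a DataFrame of features.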
def psfeatureTime(data):
    """Compute row-wise summary statistics of a numeric DataFrame.

    Every statistic is taken with ``axis=1``, so each row of ``data`` is
    reduced to one value per feature.

    Args:
        data: DataFrame of numeric values (per the file's header comment,
            the id and label columns are expected to be removed already).

    Returns:
        DataFrame with one row per input row and the columns
        ``df_mean``, ``df_var``, ``df_std``, ``df_rms``, ``df_skew``,
        ``df_kurt``, ``df_median`` and ``df_sum``, in that order.
    """
    # Mean
    df_mean = data.mean(axis=1)
    # Variance (pandas default: sample variance, ddof=1)
    df_var = data.var(axis=1)
    # Standard deviation (pandas default: sample std, ddof=1)
    df_std = data.std(axis=1)
    # Root mean square: sqrt(mean(x^2)). The shortcut sqrt(mean^2 + std^2)
    # is only exact for the population std (ddof=0); with the sample std
    # used above it overestimates the RMS and is NaN for single-value rows,
    # so compute it directly from the squared values instead.
    df_rms = (data ** 2).mean(axis=1) ** 0.5
    # Skewness
    df_skew = data.skew(axis=1)
    # Kurtosis. NOTE(review): this can come out as NaN; pandas needs at
    # least four non-missing values per row to estimate it -- confirm the
    # input width if NaNs show up here.
    df_kurt = data.kurt(axis=1)
    # Median
    df_median = data.median(axis=1)
    # Sum
    df_sum = data.sum(axis=1)

    column = ['df_mean', 'df_var', 'df_std', 'df_rms', 'df_skew', 'df_kurt', 'df_median', 'df_sum']
    featuretime_list = pd.concat(
        [df_mean, df_var, df_std, df_rms, df_skew, df_kurt, df_median, df_sum],
        axis=1,
    )
    featuretime_list.columns = column
    return featuretime_list