# Pandas 笔记

## 文件的读取与保存

```python
data = pd.read_csv("path/to/csv")
data.to_csv(filename, index=False)
```

对数值特征做标准化（每列减去该列均值，再除以该列标准差），使各特征的均值为 0、方差为 1，其中 `numeric_features` 为数值型列的列名：

```python
all_features[numeric_features] = all_features[numeric_features].apply(lambda x: (x - x.mean()) / (x.std()))
```

对于其中的缺失值：标准化之后每个数值特征的均值都是 0，因此用 0 填充缺失值就相当于用该特征的均值填充：

```python
all_features[numeric_features] = all_features[numeric_features].fillna(0)
```

对离散（类别）特征做独热编码；`dummy_na=True` 会把缺失值也视为一个类别，并为它单独生成一个指示列：

```python
all_features = pd.get_dummies(all_features, dummy_na=True)
```

将预测值与原 `Id` 列合并成一个新的 DataFrame，再保存为提交文件（`preds.reshape(1, -1)[0]` 用于把预测结果展平成一维数组）：

```python
submit_df = test_data[['Id']].copy()
submit_df['label'] = pd.Series(preds.reshape(1, -1)[0])
submit_df.to_csv(filename, index=False)
```