import pandas as pd
# Column labels applied to the data file, in file order:
# longitude, latitude, median housing age, total rooms, total bedrooms,
# population, households, median income, median house value.
column_names = [
    'longitude',
    'latitude',
    'housingMedianAge',
    'totalRooms',
    'totalBedrooms',
    'population',
    'households',
    'medianIncome',
    'medianHouseValue',
]

# Location of the data file; adjust this path to match the local setup.
data_path = r"E:\地理探测器\SHAP\CaliforniaHousing\cal_housing.data"

# Read as comma-separated text with header=None, so the first line is treated
# as data and the labels above become the column names.
data = pd.read_csv(data_path, names=column_names, header=None, sep=',')

# Split into the target vector y and the feature matrix X (every other column).
y = data['medianHouseValue']
X = data.drop(columns='medianHouseValue')
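# NOTE(review): the lines below are stray non-code residue (they look like
# page-scrape artifacts); kept as comments so the file parses.
# 11-16
# 1966

# 04-16
# 4773

# 01-11
# 4461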
