We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 189a635, commit bd2c193 (Copy full SHA for bd2c193)
1 file changed
python/housing_data/california_hcd_data.py
@@ -80,7 +80,11 @@ def load_california_hcd_data(
80
assert df["building_type"].isnull().sum() < 50
81
df = df[df["building_type"].notnull()]
82
83
- df = df.rename(columns={"YEAR": "year"}).astype({"year": str})
+ # Drop rows where YEAR is not parseable as an int
84
+ df = df.rename(columns={"YEAR": "year"})
85
+ df["year"] = pd.to_numeric(df["year"], errors="coerce").replace({np.nan: None})
86
+ df = df.dropna(subset=["year"])
87
+ df["year"] = df["year"].astype(int).astype(str)
88
89
places_df = _aggregate_to_geography(df, "place", data_path)
90
counties_df = _aggregate_to_geography(df, "county", data_path)
0 commit comments