import numpy as np
import pandas as pd
# Folder that holds the three CSV inputs (machine-specific Windows path).
path = r"C:\Users\Tsinghua-yincheng\Desktop\SZday74"

# Load each table; the file name is appended to the folder with a backslash.
pop = pd.read_csv("\\".join([path, "state-population.csv"]))
areas = pd.read_csv("\\".join([path, "state-areas.csv"]))
abbrevs = pd.read_csv("\\".join([path, "state-abbrevs.csv"]))

# Preview the first five rows of the population table.
pop.head(5)
data:image/s3,"s3://crabby-images/23a6e/23a6e8bbc61b1355ccc53c74ecb4aae908adcdd7" alt="在这里插入图片描述"
# Preview the first five rows of the area table.
areas.head(5)
data:image/s3,"s3://crabby-images/2012f/2012f315379d7c7c590e1135e2b62304fa717dff" alt="在这里插入图片描述"
# Preview the first five rows of the abbreviation table.
abbrevs.head(5)
data:image/s3,"s3://crabby-images/cbea2/cbea26b1e3d24991674923197547f373aca5f185" alt="在这里插入图片描述"
# Show the (rows, columns) shape of each loaded table, in load order.
# NOTE(review): `display` is not defined in this file; presumably the
# IPython/Jupyter built-in — confirm the script only runs in a notebook.
display(*(table.shape for table in (pop, areas, abbrevs)))
data:image/s3,"s3://crabby-images/7e286/7e286b9f67abe16c42dc9b261a0467ce0276e51f" alt="在这里插入图片描述"
# Outer-join the population rows with the abbreviation lookup: the
# "state/region" value in `pop` is matched against "abbreviation" in
# `abbrevs`. how="outer" keeps rows from either side that have no match.
merged = pop.merge(
    abbrevs,
    how="outer",
    left_on="state/region",
    right_on="abbreviation",
)
merged
data:image/s3,"s3://crabby-images/93d4b/93d4bf39012ed055bbc56fcc14ec81919afb960a" alt="在这里插入图片描述"
# "abbreviation" served only as the right-hand join key; remove that column.
merged = merged.drop(columns="abbreviation")
merged
data:image/s3,"s3://crabby-images/57e62/57e6202f9b306a0162527b9905fcb5ffe3f0936a" alt="在这里插入图片描述"
# Per column: does it contain at least one missing value?
merged.isna().any()
data:image/s3,"s3://crabby-images/fe0a1/fe0a18b6814542bfd28128fad3fdb7fbf2408793" alt="在这里插入图片描述"
# Show the rows whose "population" value is missing.
merged.loc[merged["population"].isna()]
data:image/s3,"s3://crabby-images/33b1a/33b1ac4422e5457904bda92c1cff9d2d3c2a6054" alt="在这里插入图片描述"
# "state/region" codes of the rows that got no full state name from the join.
merged["state/region"][merged["state"].isna()]
data:image/s3,"s3://crabby-images/5a0d2/5a0d2922791a82c23adae3a3c592bbed03abcaf0" alt="在这里插入图片描述"
# Distinct "state/region" codes that have no full state name.
merged["state/region"][merged["state"].isna()].unique()
data:image/s3,"s3://crabby-images/80bf5/80bf571baee9e873dc8febc1014acabb1fee9441" alt="在这里插入图片描述"
# Fill in the full name for the two region codes handled here.
merged.loc[merged["state/region"].eq("PR"), "state"] = "Puerto Rico"
merged.loc[merged["state/region"].eq("USA"), "state"] = "United States"

# Re-run the per-column missing-value check after the fill.
merged.isna().any()
data:image/s3,"s3://crabby-images/a6364/a6364baab91934eb6f2822873771ee6230e70b51" alt="在这里插入图片描述"
# Display the merged table after the state names were filled in.
merged
data:image/s3,"s3://crabby-images/6bd79/6bd79dec576598d7b50c461012049e5f1aa43796" alt="在这里插入图片描述"
# Left-join the area table on "state": every row of `merged` is kept, and
# rows with no matching state in `areas` get a missing area value.
final = merged.merge(areas, how="left", on="state")
final
data:image/s3,"s3://crabby-images/ffd35/ffd358d7c81e6970f96a058e69c7482579418883" alt="在这里插入图片描述"
# (rows, columns) of the table after joining in the areas.
final.shape
data:image/s3,"s3://crabby-images/c2bdf/c2bdf8237dec4605e44b8061fd533d46fe368efc" alt="在这里插入图片描述"
# Per column: does the joined table contain at least one missing value?
final.isna().any()
data:image/s3,"s3://crabby-images/5176a/5176a8c2464937c10166dba825858907bf58629f" alt="在这里插入图片描述"
# State names of the rows that have no area value.
final.loc[final["area (sq. mi)"].isna(), "state"]
data:image/s3,"s3://crabby-images/b4cbf/b4cbfbabedb76e70ee96e8173f9a7f57b9a2c059" alt="在这里插入图片描述"
# Distinct state names that have no area value.
final.loc[final["area (sq. mi)"].isna(), "state"].unique()
data:image/s3,"s3://crabby-images/bad0f/bad0f1ff86a44f89ab2fe065ed41400318342f12" alt="在这里插入图片描述"
# Discard every row that still has a missing value in any column.
final = final.dropna()
final
data:image/s3,"s3://crabby-images/d21a6/d21a665fe83d3a35152cb95fbde6a9ee207d943c" alt="在这里插入图片描述"
# Re-run the per-column missing-value check after dropping incomplete rows.
final.isna().any()
data:image/s3,"s3://crabby-images/dbebc/dbebc66ba07b42a7326820abaecde75ed6fabf9c" alt="在这里插入图片描述"
# Display the cleaned table.
final
data:image/s3,"s3://crabby-images/c452d/c452d990361b4f22d65c9c1ef005c6aaf4aa7f5d" alt="在这里插入图片描述"
# Keep only the rows where year is 2010 and the "ages" column is 'total'.
data2010 = final.query(expr="year==2010 & ages=='total'")
data2010
data:image/s3,"s3://crabby-images/fe3e2/fe3e2cb76dbc25eccb475cb104bdd2fa759d21bf" alt="在这里插入图片描述"
# (rows, columns) of the 2010 / total-ages selection.
data2010.shape
data:image/s3,"s3://crabby-images/1bff8/1bff8b6a08e28452530a5c4ff002e561a4f25cf2" alt="在这里插入图片描述"
# Make the state name the row index, so later results are labelled by state.
data2010 = data2010.set_index("state")
data2010
data:image/s3,"s3://crabby-images/ef22c/ef22cb6f4b4aab8cf9689f31fd6602402471a5cb" alt="在这里插入图片描述"
# Population divided by area, element-wise per state (the area column is
# labelled "sq. mi").
density = data2010["population"] / data2010["area (sq. mi)"]
density
data:image/s3,"s3://crabby-images/bac8c/bac8cce6e544eaf2665b5ed8f8fee838e764fc1d" alt="在这里插入图片描述"
# Order from highest to lowest density, then show the ten highest entries.
density = density.sort_values(ascending=False)
density.head(10)
data:image/s3,"s3://crabby-images/f8beb/f8bebc55b7f53eb7c41013b90fae71e0d9bb6810" alt="在这里插入图片描述"
# Last ten entries of `density`; after the descending sort above these are
# the ten lowest values.
density.tail(10)
data:image/s3,"s3://crabby-images/03e8c/03e8c1cbe79a65d48181b68ce5af2f8c36fde273" alt="在这里插入图片描述"
|