import geopandas


# read the district boundary shapefile into a geodataframe,
# decoding its attribute table as utf-8
district_gdf = geopandas.read_file("data/kgz_admbnda_adm2_moes_20181119.shp", encoding='utf-8')

# view the attribute information
district_gdf.head()


# view the geometry
district_gdf.plot()


# view the coordinate reference system
district_gdf.crs


# set the coordinate reference system
# set_crs only labels the existing coordinates, it does not transform them.
# allow_override=True keeps the original behaviour of replacing any CRS that
# was already read from the file; assigning to `.crs` directly for that purpose
# is deprecated in recent geopandas releases.
district_gdf = district_gdf.set_crs("EPSG:4326", allow_override=True)


# reproject the coordinate system to another coordinate system
# (to_crs transforms the coordinates and returns a new geodataframe)
district_utm_gdf = district_gdf.to_crs("EPSG:32643")
# view the reprojected geometry
district_utm_gdf.plot()


# a column can be read with dictionary-style indexing ...
district_gdf['ADM2_KY']


# ... or, equivalently, as an attribute of the geodataframe
district_gdf.ADM2_KY


# select by attribute: keep only the rows whose Shape_Area is greater than 0.7
selected_gdf = district_gdf.loc[district_gdf['Shape_Area'] > 0.7]
selected_gdf


# view the geometry of the selected rows
selected_gdf.plot()


# load the settlements csv file into a plain pandas dataframe
import pandas
settlements_df = pandas.read_csv("data/kgz_misc_popp.csv")
settlements_df.head()


# build point geometries from the longitude (x) and latitude (y) columns,
# then wrap the table in a geodataframe with the coordinate system declared
settlement_points = geopandas.points_from_xy(settlements_df['longitude'],
                                             settlements_df['latitude'])
settlements_gdf = geopandas.GeoDataFrame(settlements_df,
                                         geometry=settlement_points,
                                         crs="EPSG:4326")
settlements_gdf.head()


# save the points as a shapefile, writing the attribute table as utf-8
settlements_gdf.to_file("data/settlements_xy.shp", encoding='utf-8')


# draw the district boundaries as a white background with black outlines,
# then plot the settlements on the same axes
ax = district_gdf.plot(edgecolor='black', color='white')
settlements_gdf.plot(ax=ax)


# spatial join: keep each settlement that intersects a district and attach
# that district's attributes to it
# (`predicate` replaces the `op` keyword, which was deprecated in geopandas 0.10
# and removed in later releases)
district_settlements_gdf = geopandas.sjoin(settlements_gdf, district_gdf, how="inner", predicate='intersects')
district_settlements_gdf.head()


# alter the joined dataframe so that only the relevant columns are left
# .copy() makes this an independent frame, so adding a column below does not
# write into a slice of the join result (SettingWithCopyWarning)
district_settlements_gdf = district_settlements_gdf[['ADM2_PCODE', 'geometry']].copy()

# create a new column called count
# this contains values that will be added together to get the total count
district_settlements_gdf['count'] = 1

# group by ADM2_PCODE using sum to aggregate the other columns
settlements_dissolve_gdf = district_settlements_gdf.dissolve(by='ADM2_PCODE', aggfunc='sum')
settlements_dissolve_gdf.head()


# view the dissolved settlements coloured by their count
settlements_dissolve_gdf.plot(column='count');


# convert the dissolved settlements geodataframe into a pandas dataframe and drop the geometry
settlements_dissolve_gdf = pandas.DataFrame(settlements_dissolve_gdf.drop(columns='geometry'))

# merge the dissolved settlements onto the district geodataframe using attributes
# how='left' keeps every district, including those with no matching settlements
district_gdf = district_gdf.merge(settlements_dissolve_gdf, on='ADM2_PCODE', how='left')

# if there are any districts that don't have a count, they will have NaN in the column
# make sure these are converted to zero so they show up in the map
# (assign the result back: calling fillna(inplace=True) on a selected column is
# chained assignment, which warns in pandas 2.x and does not update the frame
# under copy-on-write)
district_gdf['count'] = district_gdf['count'].fillna(0)
district_gdf.head()


import matplotlib.pyplot as plt

# set up the plot
fig, ax = plt.subplots(1, 1)
# set the size of the plot
fig.set_size_inches(10, 6)

# plot the districts coloured by their settlement count, with a horizontal
# colour bar as the legend
district_gdf.plot(column='count',
                  ax=ax,
                  cmap='YlOrRd',
                  legend=True,
                  legend_kwds={'label': "Number of settlements by district",
                               'orientation': "horizontal"})


# save the figure
# `alpha` is not a savefig keyword: older matplotlib ignored it and newer
# versions raise TypeError, so it is dropped here.
# NOTE(review): if a transparent background was intended, pass transparent=True.
fig.savefig('data/district_settlements.png', dpi=300)


# pick out the district whose ADM2_PCODE is KG04220000000 for the exercise
exercise_gdf = district_gdf.loc[district_gdf['ADM2_PCODE'] == 'KG04220000000']
exercise_gdf


# enter your code here

# More Advanced Python Usage

# Using shapefiles with GeoPandas

# Exercises