This tutorial will guide the user through the creation of population-weighted wealth maps and statistics for administrative areas of interest. After an explanation of micro-level wealth and population estimates, the user will learn to obtain this data for a country of interest alongside the boundaries for the country's administrative areas. These population and wealth data are next joined by location, aggregated to administrative areas, and the wealth data weighted by population. The user is finally guided through validation of their results and exporting the results as maps and tabular statistics. Throughout, the user will be introduced to widely useful Python packages and code as well as Google Earth Engine, a powerful tool for analyzing geographic and satellite imagery.
This tutorial follows the code and techniques developed by Emily Aiken and Joshua Blumenstock at the University of California, Berkeley. It provides an introduction to the data sources and code required to create population-weighted wealth measures and maps for any country or region of interest.
For policymakers and NGOs trying to assist the most vulnerable with limited resources, it is of primary importance to have an accurate view of their populations. Traditionally, surveys have been the only way to obtain this information, but the time and expense required for surveys - as well as the speed at which surveys can become outdated due to changing circumstances - make it challenging to identify all individuals in need.
However, with the increasing prevalence of technologies which collect data at scale - including satellites, mobile phones, and WiFi - there are also emerging possibilities for the use of these data. Machine learning models, which can make sense of data on a scale impossible for humans, are being used to combine these observational data with traditional survey responses to expand their usefulness: by providing a model data such as satellite imagery, phone networks, and WiFi connectivity alongside ground-truth data collected by surveys, the model can learn which features best identify characteristics such as wealth and population, creating predictions for other locations where survey information is unavailable.
For the wealth data component of this tutorial, we'll use an innovative geographic wealth dataset created from non-traditional sources. The Relative Wealth Index utilizes satellite imagery as well as mobile phone data, topographic maps, and Facebook connectivity data alongside wealth surveys to develop fine-grained (2.4km resolution) estimates of the relative standard of living within countries. Developed as part of a collaboration between UC Berkeley’s Center for Effective Global Action and Facebook’s Data for Good, these wealth estimates for 93 low- and middle-income countries are made freely available to aid in the work of policymakers and NGOs. See Micro-Estimates of Wealth for all Low- and Middle-Income Countries by Guanghua Chi, Han Fang, Sourav Chatterjee, and Joshua Blumenstock for details of the data creation and validation. Recent work such as this working paper by Emily Aiken, Suzanne Bellue, Dean Karlan, Christopher Udry, and Joshua Blumenstock demonstrates the value of such ML-derived wealth maps.
To overcome the limitations of survey data, many organizations are working to create comprehensive, granular, and accurate population estimates for countries across the globe. One such source is the High Resolution Population Density Maps and Demographic Estimates, created as a collaboration between the Center for International Earth Science Information Network (CIESIN) at Columbia University and Facebook Data for Good. These provide estimates of relative population for most countries in the world at 30m resolution and are developed from satellite imagery and census data.
WorldPop's Population Count datasets are another source of nearly-global population data. WorldPop provides an entirely open-access collection of spatial demographic datasets for Central and South America, Asia, and Africa. There are multiple different Population Count datasets provided through WorldPop, with data for individual countries and globally available using either a top-down or bottom-up modelling approach. The top-down approach utilizes collected census data - typically at the level of a particular administrative area - and combines these with geospatial datasets to disaggregate population estimates to 100m or 1km resolution. These have the benefit of rolling up to administrative-level counts which match existing census counts, though countries without a recent census or countries with high mobility will likely have inaccuracies in these counts that will be reflected in the WorldPop estimates. The bottom-up approach instead uses all recent surveys available for an area alongside geospatial datasets to build estimated population counts at 100m resolution. These can provide greater accuracy where census data is outdated or where ground conditions are rapidly changing. For more information on the difference between top-down and bottom-up maps, see WorldPop's explanation of the differences.

A final consideration if using the top-down estimates is whether to use data built with a constrained or unconstrained modelling approach. The unconstrained approach produces estimates over the entire land surface, while the constrained approach first limits its estimation to areas already mapped as containing settlements. The constrained approach can result in more accurate population allocation for areas of no population or high population as compared to the unconstrained approach, but it is dependent on accurate settlement mapping, which is not always available. For further discussion of the benefits and costs of each method, see WorldPop's explanation of the differences. Compared to the High Resolution Population Density Maps described above, WorldPop's Population Counts have the additional benefit of providing population data for different years, from 2000-2020. This can be useful if performing any historical analyses requiring population values.
It is often the case that countries are governed and services provided according to hierarchical administrative areas. Recognizing and planning interventions around these areas is thus often useful and necessary for leaders both within and external to each country. There are a few organizations which aim to produce accurate, updated geographic datasets of administrative areas for the use of researchers and policymakers. GADM is one of the most comprehensive of these sources, providing maps of all countries and associated sub-divisions. The Food and Agriculture Organization's (FAO's) Global Administrative Unit Layers (FAO GAUL) also provides geographic boundaries for administrative units across many countries in the world, with the goal of creating an accurate, standardized source of historical and current administrative areas.
In geospatial data analysis, data can be classified into two categories: raster and vector data. A graphic comparison between raster and vector data can be found in the World Bank Nighttime Lights Tutorial module 2, section 1.
In this tutorial, we will use both vector and raster data. Geospatial data in vector format are often stored in a shapefile, a popular format for storing vector data developed by ESRI. The shapefile format is actually composed of multiple individual files which together make up the full dataset. At a minimum, there will be 3 file types included with this geographic data (.shp, .shx, .dbf), but there are often other files included which store additional information. In order to be read and used as a whole, all files must have the same name and be in the same folder. Because the structures of points, lines, and polygons differ, each shapefile can only contain one vector type (all points, all lines, or all polygons). You will not find a mixture of point, line, and polygon objects in a single shapefile, so in order to work with these different types in the same analysis, multiple shapefiles will need to be used and layered. For more details on shapefiles and file types, see this documentation.
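As a quick illustration (the file name boundaries.shp here is hypothetical - any shapefile with its sibling files alongside it behaves the same way), reading a shapefile with GeoPandas and confirming its single vector type looks like:
import geopandas as gpd
# Reading the .shp automatically picks up the sibling .shx and .dbf files
gdf = gpd.read_file('boundaries.shp')
# A shapefile holds one vector type, so this prints a single value such as
# ['Polygon'] (possibly alongside its multi-part variant, 'MultiPolygon')
print(gdf.geom_type.unique())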
Raster data, on the other hand, is often stored in Tagged Image File Format (TIFF or TIF). A GeoTIFF is a TIFF file that follows a specific standard for structuring metadata. The metadata stored in a TIFF is called a tif tag, and GeoTIFFs often contain tags including spatial extent, coordinate reference system, resolution, and number of layers.
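As an illustrative sketch (assuming a local file named example.tif), these tags can be inspected with rioxarray, a package we'll also use later in this tutorial:
import rioxarray
raster = rioxarray.open_rasterio('example.tif')
print(raster.rio.crs)           # coordinate reference system
print(raster.rio.bounds())      # spatial extent
print(raster.rio.resolution())  # pixel size in CRS units
print(raster.rio.count)         # number of bands/layers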
More information and examples can be found in sections 3 & 4 of the Earth Analytics Course.
One option we'll consider for sourcing administrative areas will be Google Earth Engine. For all necessary Python setup and an introduction to our use of the GEE Python API, see the World Bank Nighttime Light Tutorial, module 2 sections 2-5. In particular, before proceeding you will need to have geemap installed on your machine, and you will need to apply for a Google Earth Engine account here. It may take a day or longer for your Google Earth Engine account to be granted access.
Two of the primary packages we'll be using, Pandas and GeoPandas, must be installed according to their installation instructions: Pandas Installation and GeoPandas Installation. If you're on Windows, GeoPandas installation can occasionally be temperamental - using an environment, as described in the World Bank Nighttime Lights Tutorial, can often circumvent any issues, but if you're still having problems, there are a number of guides online, such as this Practical Data Science guide or this Medium post by Nayane Maia, which provide installation help. Using Windows Subsystem for Linux (WSL) can also make use of tricky packages like GeoPandas easier.
For this tutorial, we'll demonstrate the process of creating population-weighted wealth estimates for all administrative levels in the country of Jordan. This process can be replicated for any country or region of interest, and the sources of data can be swapped as appropriate to use the most accurate sources of population, wealth, and administrative areas.
The relative wealth indices created by Chi et al., which we'll use in this tutorial, can be downloaded as csv files by country from the Humanitarian Data Exchange. To download, find the file associated with your country of interest ('Jordan_relative_wealth_index.csv' for this example) and select 'download'.

Save the relative wealth index file in the same folder as this Python script for easiest use. Once downloaded, we can read the file into Python using the Pandas package and convert it to geographic data using GeoPandas. jor_relative_wealth_index.csv is the csv file for Jordan downloaded from the Humanitarian Data Exchange - to utilize a different country's data, replace the file path with the path and name of your file. (Note: only the name of the file is included in this example because the csv file is in the same folder as this Python code. This leverages relative paths instead of absolute paths - if you're unfamiliar with relative paths, see this Earth Data Science tutorial.)
import pandas as pd
import geopandas as gpd
rwi = pd.read_csv('jor_relative_wealth_index.csv')
# Use latitude and longitude to create geographic points
rwi = gpd.GeoDataFrame(rwi,
geometry=gpd.points_from_xy(rwi['longitude'], rwi['latitude']))
rwi.set_crs('epsg:4326',inplace=True)
latitude | longitude | rwi | error | geometry | |
---|---|---|---|---|---|
0 | 32.110495 | 35.804443 | 0.602 | 0.548 | POINT (35.80444 32.11050) |
1 | 31.700129 | 35.584717 | 0.454 | 0.555 | POINT (35.58472 31.70013) |
2 | 31.400535 | 35.716553 | -0.189 | 0.498 | POINT (35.71655 31.40053) |
3 | 31.942840 | 35.848389 | 1.432 | 0.487 | POINT (35.84839 31.94284) |
4 | 32.184911 | 36.331787 | 0.464 | 0.549 | POINT (36.33179 32.18491) |
... | ... | ... | ... | ... | ... |
2782 | 32.685619 | 35.958252 | 0.103 | 0.564 | POINT (35.95825 32.68562) |
2783 | 30.817346 | 36.068115 | -0.239 | 0.424 | POINT (36.06812 30.81735) |
2784 | 30.078601 | 35.211182 | -0.258 | 0.544 | POINT (35.21118 30.07860) |
2785 | 31.475524 | 36.002197 | -0.215 | 0.489 | POINT (36.00220 31.47552) |
2786 | 31.886886 | 35.584717 | 0.284 | 0.546 | POINT (35.58472 31.88689) |
2787 rows × 5 columns
We can see a snapshot of our relative wealth index in tabular form above. We can view this data as a map using matplotlib, a Python package widely used for creating visualizations.
import matplotlib.pyplot as plt
fig, ax = plt.subplots(1, 1, figsize=(10,10))
# column='rwi' defines which column from our dataframe to color the points by
rwi.plot(ax=ax, column='rwi',legend=True)
ax.axis('off')
ax.set_title('Relative Wealth Index Values')
plt.show()
While we don't yet have a background map defining the country's borders, we can see the fine grain of the relative wealth index data in the map of Jordan above. The darker colors indicate the lowest wealth areas, relative to the rest of the country, while the yellow points represent the highest wealth areas.
The population maps from WorldPop can be accessed via their API, which can enable greater reproducibility and ease of use, especially if multiple datasets are needed. The gather_worldpop_data() function below will allow the user to access data from WorldPop via the API by simply selecting the desired WorldPop data (population for this example), country, and year they are interested in. However, if desired, the datasets can also be downloaded as GeoTIFF files from the WorldPop website.
You'll need to install the packages requests, which will allow us to use WorldPop's API to access the data, and rioxarray, which will allow us to read in the GeoTIFF file we download from WorldPop and convert it to a GeoPandas GeoDataFrame. To install these packages, follow their respective installation instructions: requests Installation and rioxarray Installation.
import requests
import rioxarray

def gather_worldpop_data(data_type, country_iso=None, year=2015):
    """
    Build the url to pull WorldPop data from the API

    Inputs:
        data_type (string): Data type options are 'pop' (population),
            'births', 'pregnancies', and 'urban_change'.
        country_iso (string): The 3-letter country code, if desired. Default
            will be global.
        year (int): the 4-digit year of interest for the data. Default will
            be 2015.

    Return (str, rioxarray DataArray): returns the name of the .tif file
        downloaded onto your computer containing the data and the DataArray
        containing the population counts read in using rioxarray.
    """
    # Build the API url according to user selection
    url_base = "https://www.worldpop.org/rest/data"
    url = url_base + '/' + data_type + '/wpgp'
    if country_iso:
        url = url + '?iso3=' + country_iso
    # Request the list of available datasets
    json_resp = requests.post(url).json()
    # Filter to the entry matching the desired year (comparing as strings,
    # since the API returns 'popyear' as a string)
    json_resp = [entry for entry in json_resp['data']
                 if str(entry.get('popyear')) == str(year)][0]
    # Obtain exact .geotiff file name for the desired data
    geotiff_file = json_resp['files'][0]
    print('Obtaining file', geotiff_file)
    geotiff_data = requests.get(geotiff_file)
    # Default to 'global' in the file name when no country is given
    file_name = 'worldpop_' + (country_iso or 'global') + '_' + str(year) + '.tif'
    print('Writing to', file_name)
    with open(file_name, 'wb') as f:
        f.write(geotiff_data.content)
    # Read in the WorldPop data as a GeoTIFF
    worldpop_raster = rioxarray.open_rasterio(file_name)
    return file_name, worldpop_raster
jordan_pop_file, jordan_pop = gather_worldpop_data('pop','JOR',2019)
Obtaining file https://data.worldpop.org/GIS/Population/Global_2000_2020/2019/JOR/jor_ppp_2019.tif
Writing to worldpop_JOR_2019.tif
We can now convert this data to a GeoDataFrame to be able to easily work with it in Python and join it with our other datasets. We'll do this according to the process described in this stackoverflow post.
jordan_pop = jordan_pop.squeeze().drop('spatial_ref').drop('band')
jordan_pop.name = 'population'
worldpop_pop_df = jordan_pop.to_dataframe().reset_index()
worldpop_pop_df.head()
y | x | population | |
---|---|---|---|
0 | 33.3675 | 34.957500 | -99999.0 |
1 | 33.3675 | 34.958333 | -99999.0 |
2 | 33.3675 | 34.959167 | -99999.0 |
3 | 33.3675 | 34.960000 | -99999.0 |
4 | 33.3675 | 34.960833 | -99999.0 |
We now have our coordinates - latitude and longitude - along with the associated population values. We can see some data cleansing is needed to remove coordinates with no population value (denoted by -99999.0 population), and we'll also want to convert these coordinates into a geographic type we can use with GeoPandas.
# remove populations below 0
worldpop_pop_df = worldpop_pop_df[worldpop_pop_df['population'] > 0]
# convert lat/long to geometry
worldpop_pop_df['geometry'] = gpd.points_from_xy(worldpop_pop_df['x'], worldpop_pop_df['y'])
# convert to GeoDataFrame
worldpop_pop_gdf = gpd.GeoDataFrame(worldpop_pop_df)
worldpop_pop_gdf.head()
y | x | population | geometry | |
---|---|---|---|---|
4606 | 33.367500 | 38.795833 | 0.003340 | POINT (38.79583 33.36750) |
4607 | 33.367500 | 38.796667 | 0.003368 | POINT (38.79667 33.36750) |
9818 | 33.366667 | 38.794167 | 0.003384 | POINT (38.79417 33.36667) |
9819 | 33.366667 | 38.795000 | 0.003340 | POINT (38.79500 33.36667) |
9820 | 33.366667 | 38.795833 | 0.003384 | POINT (38.79583 33.36667) |
Excellent, we can now use this population data with our relative wealth values to create our population-weighted wealth estimates. As a final step, let's view these population values on a map.
Warning: This is a very slow, intensive map to build due to the granularity of the population counts. This step is optional, so it can be skipped to conserve time or resources.
import matplotlib.pyplot as plt
fig, ax = plt.subplots(1, 1, figsize=(10,10))
# column='population' defines which column from our dataframe to color the points by
worldpop_pop_gdf.loc[:,('population','geometry')].plot(ax=ax, column='population',legend=True)
ax.axis('off')
ax.set_title('WorldPop Population Counts 2019')
plt.show()
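If the full plot is too slow or memory-intensive on your machine, one workaround (a sketch, not part of the original workflow) is to plot a random sample of the points, which preserves the broad spatial pattern at a fraction of the cost:
# Plot a random subset of the points; adjust n to your dataset's size
sample = worldpop_pop_gdf.sample(n=100000, random_state=1)
fig, ax = plt.subplots(1, 1, figsize=(10,10))
sample.plot(ax=ax, column='population', legend=True)
ax.axis('off')
ax.set_title('WorldPop Population Counts 2019 (sampled)')
plt.show()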
Another option for population metrics is the High Resolution Population Density Maps from Columbia's CIESIN and Facebook's Data for Good. These can be downloaded from the Humanitarian Data Exchange in either GeoTIFF or csv format: here, we'll demonstrate with the csv.
To download, select download for the appropriate population .csv.zip from the Humanitarian Data Exchange site above. Save this .csv.zip in the same folder as your Python script. You'll need to unzip this file to use it, which you can do by either right-clicking and selecting 'Extract All' (on Windows) or double-clicking (on MacOS). Once unzipped, we can ingest it here and begin using the population density values.
pop = pd.read_csv('population_jor_2019-07-01.csv')
pop = gpd.GeoDataFrame(pop, geometry=gpd.points_from_xy(pop['Lon'], pop['Lat']))
pop.set_crs('epsg:4326',inplace=True)
Lat | Lon | Population | geometry | |
---|---|---|---|---|
0 | 32.557361 | 35.861806 | 17.355776 | POINT (35.86181 32.55736) |
1 | 32.554583 | 35.860139 | 17.355776 | POINT (35.86014 32.55458) |
2 | 32.557917 | 35.866806 | 17.355776 | POINT (35.86681 32.55792) |
3 | 32.557639 | 35.854583 | 17.355776 | POINT (35.85458 32.55764) |
4 | 32.572361 | 35.861528 | 17.355776 | POINT (35.86153 32.57236) |
... | ... | ... | ... | ... |
877193 | 32.106806 | 35.795417 | 4.363106 | POINT (35.79542 32.10681) |
877194 | 32.110972 | 35.774583 | 4.363106 | POINT (35.77458 32.11097) |
877195 | 32.105694 | 35.781528 | 4.363106 | POINT (35.78153 32.10569) |
877196 | 32.091250 | 35.775694 | 4.363106 | POINT (35.77569 32.09125) |
877197 | 32.109861 | 35.802639 | 4.363106 | POINT (35.80264 32.10986) |
877198 rows × 4 columns
We see we've successfully obtained population density values according to point locations, which we can also visualize as a map in the same way we've done above.
fig, ax = plt.subplots(1, 1, figsize=(10,10))
# column='Population' identifies which column to use in coloring the points
pop.plot(ax=ax, column='Population',legend=True)
ax.axis('off')
ax.set_title('Population Density')
plt.show()
Either of these population data sources will allow you to create a population-weighted map of wealth, as will any other population data stored as a GeoDataFrame with a Point geometry and population values. To continue with this tutorial, regardless of your data source, simply ensure your data format matches the format in these examples.
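As a minimal sketch of that format check (using the dataframe names from this tutorial), you can assert the key properties before moving on:
def check_point_format(gdf, value_col):
    """Confirm a GeoDataFrame matches the point format used in this tutorial."""
    assert isinstance(gdf, gpd.GeoDataFrame), 'must be a GeoDataFrame'
    assert value_col in gdf.columns, 'missing expected value column'
    assert (gdf.geom_type == 'Point').all(), 'geometry must be Points'
    assert gdf.crs is not None, 'CRS must be set (we use epsg:4326)'
check_point_format(pop, 'Population')
check_point_format(rwi, 'rwi')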
If your population or wealth values are by area rather than single point locations, the below process of creating population-weighted wealth maps can still be performed. Rather than performing the nearest-neighbor process we'll use, you'll instead need to join your point data with your area data using a GeoPandas .sjoin(), which will allow joining the datasets where the points intersect the areas (a sketch follows below). For information and instructions on performing this join, see the GeoPandas Spatial Joins documentation.
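Here is a hedged sketch of that join, assuming a polygon GeoDataFrame named wealth_areas with an rwi column (not a dataset we download in this tutorial):
# Match each population point to the wealth polygon containing it
# (newer GeoPandas versions use predicate='within' instead of op='within')
pop_in_areas = gpd.sjoin(pop, wealth_areas, op='within', how='inner')
# Sum population within each wealth area using the joined right-hand index
area_pop = pop_in_areas.groupby('index_right')['Population'].sum()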
One option for defining administrative area boundaries is GADM, which provides shapefiles of administrative areas for any country in the world. These can be downloaded here. Select your country of interest, and then select the 'Shapefile' option to download.
Choose to save this .zip folder in the same folder as this Python script, then once it's downloaded, unzip the folder by either right-clicking and selecting 'Extract All' (on Windows) or double-clicking (on MacOS). You'll notice that the folder you downloaded contains multiple files with the same name but different suffixes: for example, gadm36_JOR_0.shp, gadm36_JOR_1.shp, and gadm36_JOR_2.shp. These numbers correspond to the level of administrative area provided: we'll want to use the Admin Level 2 file for as much granularity as possible. We can read in the GADM administrative areas we've just downloaded using GeoPandas' .read_file().
gadm_admin = gpd.read_file('./gadm36_JOR_shp/gadm36_JOR_2.shp')
gadm_admin.head()
GID_0 | NAME_0 | GID_1 | NAME_1 | NL_NAME_1 | GID_2 | NAME_2 | VARNAME_2 | NL_NAME_2 | TYPE_2 | ENGTYPE_2 | CC_2 | HASC_2 | geometry | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | JOR | Jordan | JOR.1_1 | Ajlun | None | JOR.1.1_1 | Ajloun | Ajlun | None | Nahia | Sub-Province | None | JO.AJ.AJ | POLYGON ((35.66704 32.24525, 35.67163 32.25445... |
1 | JOR | Jordan | JOR.1_1 | Ajlun | None | JOR.1.2_1 | Kofranjah | None | None | Nahia | Sub-Province | None | JO.AJ.KF | POLYGON ((35.78606 32.20119, 35.78002 32.19791... |
2 | JOR | Jordan | JOR.2_1 | Amman | None | JOR.2.1_1 | Amman | None | None | Nahia | Sub-Province | None | JO.AM.AM | POLYGON ((35.75007 31.86172, 35.75247 31.86657... |
3 | JOR | Jordan | JOR.2_1 | Amman | None | JOR.2.2_1 | Jizeh | Al-Jiza | None | Nahia | Sub-Province | None | JO.AM.JI | POLYGON ((35.90070 31.41894, 35.88734 31.43012... |
4 | JOR | Jordan | JOR.2_1 | Amman | None | JOR.2.3_1 | Mowaqqar | Al-Mwwqqar | None | Nahia | Sub-Province | None | JO.AM.MO | POLYGON ((36.44504 31.86145, 36.45634 31.84417... |
We can see we have a 'geometry' column providing the areas for each Admin Area, and we have the Level 0 (NAME_0), Level 1 (NAME_1), and Level 2 (NAME_2) identifiers. Let's now visualize this on a map to confirm what we have:
fig, ax = plt.subplots(1, 1, figsize=(8,8))
# column='NAME_1' identifies which column to use in coloring the areas
gadm_admin.plot(ax=ax, column='NAME_1',legend=True,cmap='tab20')
ax.axis('off')
ax.set_title('Jordan Governorate and District Administrative Areas: GADM')
plt.show()
This will work well for our purposes for any country, though with the limitation that the file must be manually downloaded and stored. For an option which we can ingest straight into Python, we can also consider the FAO GAUL 2015 areas.
FAO GAUL is another source of administrative areas, though these are not available for every country. For information on the countries and administrative levels provided by GAUL 2015, download the GAUL2015_Documentation.zip from the GAUL Catalog Page. WhatsNewGAUL2015.pdf contains a table of all countries identifying which countries and administrative levels are available.
If the countries you need are present in the FAO GAUL data, they can be downloaded using Google Earth Engine and then converted to a GeoDataFrame so they match the formatting of our population and wealth data. (For more information on converting between geemap and geopandas, see this documentation). Google Earth Engine stores the FAO GAUL 2015 data as a FeatureCollection. A FeatureCollection is a group of multiple Features, which are geometric objects and their related properties. We'll use the data with level 2 administrative areas, which are the most granular available for FAO GAUL in Google Earth Engine. The GEE page for these data can be found here.
Each time we use the GEE API, we'll need to Initialize our connection. The first time you run this code, you'll need to Authenticate using the authentication code you're provided when you are granted GEE access. For more detailed instruction, see this Introduction to Google Earth Engine in the World Bank's Nighttime Lights tutorial.
import geemap, ee
# Initialize or Authenticate GEE connection
try:
    ee.Initialize()
except Exception as e:
    ee.Authenticate()
    ee.Initialize()
# Obtain Jordan's level 2 admin data and convert to GeoDataFrame
jordan_admin = geemap.ee_to_geopandas(ee.FeatureCollection("FAO/GAUL/2015/level2").filter(ee.Filter.eq('ADM0_NAME', 'Jordan')))
jordan_admin.set_crs(4326, inplace=True)
jordan_admin.head()
geometry | ADM0_CODE | ADM0_NAME | ADM1_CODE | ADM1_NAME | ADM2_CODE | ADM2_NAME | DISP_AREA | EXP2_YEAR | STATUS | STR2_YEAR | Shape_Area | Shape_Leng | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | POLYGON ((35.59864 32.30641, 35.59948 32.29984... | 130 | Jordan | 1701 | Ajloon | 65716 | Ajloon | NO | 3000 | Member State | 2001 | 0.032220 | 1.092534 |
1 | POLYGON ((35.03999 29.78441, 35.04312 29.78150... | 130 | Jordan | 1703 | Aqaba | 65718 | Wadi Araba | NO | 3000 | Member State | 2001 | 0.217634 | 2.638096 |
2 | POLYGON ((35.59573 31.98709, 35.60333 31.99011... | 130 | Jordan | 1702 | Balqa | 65722 | Al-Salt | NO | 3000 | Member State | 2001 | 0.018047 | 0.649854 |
3 | POLYGON ((35.70837 32.61929, 35.71080 32.61822... | 130 | Jordan | 1707 | Irbid | 65740 | Irbid | NO | 3000 | Member State | 2001 | 0.023197 | 0.840361 |
4 | POLYGON ((35.69533 31.29930, 35.69598 31.29446... | 130 | Jordan | 1704 | Karak | 65724 | Al-Qaser | NO | 3000 | Member State | 2001 | 0.021907 | 0.734975 |
We can plot these administrative areas to confirm the data we've collected.
fig, ax = plt.subplots(1, 1, figsize=(8,8))
# column='ADM1_NAME' identifies which column to use in coloring the areas
jordan_admin.plot(ax=ax, column='ADM1_NAME',legend=True,cmap='tab20')
ax.axis('off')
ax.set_title('Jordan Governorate and District Administrative Areas: FAO GAUL')
plt.show()
The above map is colored by level 1 administrative areas (Governorates), with the level 2 areas (Districts) delineated by white boundaries within each colored area. For policymakers or NGOs, different levels of administrative units may be useful depending on the circumstances, so we will demonstrate creating population-weighted wealth estimates for each available administrative area.
Before we move on to creating our population-weighted wealth maps, a final task which may be useful is to create maps of population or wealth on their own. We can do this by performing an .sjoin(), which joins two dataframes that overlap in space - for our examples, it will associate all population or wealth locations which fall within a given administrative area with those areas, and we can then aggregate by our chosen area. We can demonstrate at the District level:
# join all population records to their associated admin area
district_pop = gpd.sjoin(pop, jordan_admin.loc[:,('ADM2_NAME','geometry')], op='within', how='right')
# summarize dataset by admin area, taking the mean population for each
district_pop_gb = district_pop.groupby('ADM2_NAME').mean().reset_index()
# add the geometry back into the summarized data
district_pop_gb = district_pop_gb.merge(jordan_admin.loc[:,('ADM2_NAME','geometry')], on='ADM2_NAME')
# view the first 5 rows
district_pop_gb.head()
ADM2_NAME | index_left | Lat | Lon | Population | geometry | |
---|---|---|---|---|---|---|
0 | Ail | 276131.604677 | 30.068894 | 35.494057 | 3.653675 | POLYGON ((35.31635 29.97787, 35.32536 29.97534... |
1 | Ajloon | 517203.001791 | 32.350488 | 35.763963 | 9.638121 | POLYGON ((35.59864 32.30641, 35.59948 32.29984... |
2 | Al-Aghwar Al-Janoobiya | 518752.785079 | 31.136097 | 35.503990 | 6.602994 | POLYGON ((35.36691 30.92314, 35.36833 30.92173... |
3 | Al-Aghwar Al-Shimaliya | 373908.581950 | 32.576180 | 35.992499 | 7.238341 | POLYGON ((35.88516 32.70881, 35.88813 32.70060... |
4 | Al-Ardha | 415464.500666 | 31.972914 | 35.701233 | 6.309517 | POLYGON ((35.58692 31.97971, 35.58924 31.97237... |
fig, ax = plt.subplots(1,1, figsize=(8,8))
nation = jordan_admin.dissolve(by='ADM0_NAME').reset_index()
# Create the base plots of the entire country for the number of admin level
# maps we want to create
nation.plot(ax=ax, color='lightgrey')
ax.axis('off')
# Create each admin level plot of population
district_pop_gb.plot(ax=ax, column='Population', cmap='magma', legend=True,
legend_kwds={'shrink':0.5, 'label':'Mean Population Density'})
ax.set_title('Mean Population Density by District', fontsize='xx-large')
# Save this plot as an image
plt.savefig('jordan_pop_districts.png', dpi=300)
plt.show()
# join all rwi records to their associated admin area
district_rwi = gpd.sjoin(rwi, jordan_admin.loc[:,('ADM2_NAME','geometry')], op='within', how='right')
# summarize dataset by admin area, taking the mean rwi for each
district_rwi_gb = district_rwi.groupby('ADM2_NAME').mean().reset_index()
# add the geometry back into the summarized dataset
district_rwi_gb = district_rwi_gb.merge(jordan_admin.loc[:,('ADM2_NAME','geometry')], on='ADM2_NAME')
# view the first five rows
district_rwi_gb.head()
ADM2_NAME | index_left | latitude | longitude | rwi | error | geometry | |
---|---|---|---|---|---|---|---|
0 | Ail | 1654.411765 | 30.042790 | 35.483901 | 0.253294 | 0.501294 | POLYGON ((35.31635 29.97787, 35.32536 29.97534... |
1 | Ajloon | 1459.133333 | 32.343695 | 35.741748 | 0.372467 | 0.537987 | POLYGON ((35.59864 32.30641, 35.59948 32.29984... |
2 | Al-Aghwar Al-Janoobiya | 1239.166667 | 31.138910 | 35.504557 | -0.112648 | 0.510667 | POLYGON ((35.36691 30.92314, 35.36833 30.92173... |
3 | Al-Aghwar Al-Shimaliya | 1399.212121 | 32.576247 | 35.995872 | 0.243606 | 0.509167 | POLYGON ((35.88516 32.70881, 35.88813 32.70060... |
4 | Al-Ardha | 1333.071429 | 31.956155 | 35.693011 | 0.182571 | 0.500571 | POLYGON ((35.58692 31.97971, 35.58924 31.97237... |
fig, ax = plt.subplots(1,1, figsize=(8,8))
nation = jordan_admin.dissolve(by='ADM0_NAME').reset_index()
# Create the base plots of the entire country for the number of admin level
# maps we want to create
nation.plot(ax=ax, color='lightgrey')
ax.axis('off')
# Create each admin level plot of RWI
district_rwi_gb.plot(ax=ax, column='rwi', cmap='magma', legend=True,
legend_kwds={'shrink':0.5, 'label':'Mean RWI'})
ax.set_title('Mean Relative Wealth by District', fontsize='xx-large')
# Save this plot as an image
plt.savefig('jordan_rwi_districts.png', dpi=300)
plt.show()
Since our population and wealth data are both provided as point locations, we won't be able to directly join these datasets by location. (To do so would require that each point provided in the population data also exist in the wealth data, which is unlikely given the different sources we use.) Instead, we can use a k-d tree, as demonstrated in this stackexchange post, which will allow us to combine these data by matching each point in the population data to the nearest point in the wealth data. We'll use the KDTree implementation from the scipy package, which provides this functionality of finding the nearest neighbor(s) for any point. If you haven't worked with scipy yet, you can install this package according to the Getting Started instructions. For these calculations, we'll also need numpy, a popular package for numerical operations in Python. To install numpy, see the Installation guide in the documentation.
from scipy.spatial import KDTree
import numpy as np

# Define function to find nearest neighbor and join population and wealth datasets accordingly
def ckdnearest(gdA, gdB):
    # create arrays of (x, y) coordinates from each dataset for the k-d tree
    nA = np.array(list(gdA.geometry.apply(lambda x: (x.x, x.y))))
    nB = np.array(list(gdB.geometry.apply(lambda x: (x.x, x.y))))
    # create k-d tree from dataset B
    btree = KDTree(nB)
    # find the nearest point in dataset B to each point in dataset A
    dist, idx = btree.query(nA, k=1)
    # select the nearest points in B identified in the row above
    gdB_nearest = gdB.iloc[idx].drop(columns="geometry").reset_index(drop=True)
    # join the nearest points from A and B as a geodataframe
    gdf = pd.concat(
        [
            gdA.reset_index(drop=True),
            gdB_nearest,
            pd.Series(dist, name='dist')
        ],
        axis=1)
    return gdf
# Join according to nearest neighbor using function defined above
overlay = ckdnearest(pop, rwi)
# Clarify column names (the population data's columns come first: Lat, Lon, Population)
overlay.columns = ['latitude_pop', 'longitude_pop', 'pop', 'geometry',
                   'latitude_rwi', 'longitude_rwi', 'rwi', 'error', 'dist']
# Sum population densities for each location where relative wealth is provided
overlay = overlay.groupby(['latitude_rwi', 'longitude_rwi', 'rwi'], as_index=False)\
.agg('sum')
# Clarify column names
overlay = overlay[['latitude_rwi', 'longitude_rwi', 'pop', 'rwi']]\
.rename({'pop':'pop_weight'}, axis=1)
# Scale relative wealth by population to create weighted relative wealth
overlay['weighted_rwi'] = overlay['pop_weight']*overlay['rwi']
# Convert joined dataset to GeoDataFrame
overlay = gpd.GeoDataFrame(overlay, geometry=gpd.points_from_xy(overlay['longitude_rwi'],
overlay['latitude_rwi']))
overlay.set_crs(4326,inplace=True)
# Show first 10 rows of dataset
overlay.head(10)
latitude_rwi | longitude_rwi | pop_weight | rwi | weighted_rwi | geometry | |
---|---|---|---|---|---|---|
0 | 29.353451 | 34.991455 | 245.844278 | 0.081 | 19.913386 | POINT (34.99146 29.35345) |
1 | 29.353451 | 35.035400 | 106.532520 | 0.217 | 23.117557 | POINT (35.03540 29.35345) |
2 | 29.353451 | 35.057373 | 524.467792 | 0.637 | 334.085984 | POINT (35.05737 29.35345) |
3 | 29.372601 | 34.969482 | 12324.993123 | 0.976 | 12029.193288 | POINT (34.96948 29.37260) |
4 | 29.372601 | 34.991455 | 1524.234522 | 0.125 | 190.529315 | POINT (34.99146 29.37260) |
5 | 29.391747 | 34.969482 | 2237.182927 | 0.837 | 1872.522110 | POINT (34.96948 29.39175) |
6 | 29.391747 | 34.991455 | 1065.325203 | 0.535 | 569.948984 | POINT (34.99146 29.39175) |
7 | 29.391747 | 35.035400 | 106.532520 | -0.163 | -17.364801 | POINT (35.03540 29.39175) |
8 | 29.410890 | 34.969482 | 1966.754222 | 0.748 | 1471.132158 | POINT (34.96948 29.41089) |
9 | 29.410890 | 34.991455 | 549.052220 | 0.482 | 264.643170 | POINT (34.99146 29.41089) |
We see that, once we've joined according to nearest neighbor and created our weighted relative wealth measure, we're left with a dataset which still provides these weighted wealth measures at individual point locations. If this level of granularity is desired, a user can stop the process at this point and map this data as individual locations, as we've done above.
fig, ax = plt.subplots(1, 1, figsize=(10,10))
# column='weighted_rwi' identifies which column to use in coloring the points
overlay.plot(ax=ax, column='weighted_rwi',legend=True)
ax.axis('off')
ax.set_title('Jordan Weighted Wealth Measures')
plt.show()
However, for use in research or policy decisions, it will often be helpful to have these measures provided at the level of administrative units. We'll aggregate each administrative layer of interest separately, so the code below should be changed according to how many layers the dataset you're using provides and which layers are of interest. For our example, with 2 layers of administrative units, we'll ensure we have dataframes representing the geographic areas of each of our two layers. Since the data we downloaded were already at level 2 granularity, we'll only need to create the level 1 dataframe using .dissolve(). Dissolving by 'ADM1_NAME' will give us a dataframe at the admin level 1 granularity ('Governorates' in Jordan). If you have 3 or more admin levels, you can create additional dataframes with this same technique, each time dissolving by the admin level of interest. Once you have all necessary admin level dataframes, you can use the script below to add population-weighted wealth measures to each administrative level.
# Roll up full level 2 admin data to level 1 for processing
# (if more than 2 admin levels, do this for each level above the lowest)
governorates = jordan_admin.dissolve(by='ADM1_NAME').reset_index()

maps = {}
# For each administrative level dataset, provide the name of the administrative
# unit layer (ie, divisions, districts, counties, etc), the column names for the
# unique area code and area name in your dataset, and the dataframe itself
for name, numberkey, namekey, df in [('governorates', 'ADM1_CODE', 'ADM1_NAME', governorates),
                                     ('districts', 'ADM2_CODE', 'ADM2_NAME', jordan_admin)]:
    # Join datasets so admin units are matched with the wealth measure points within unit boundaries
    grouped = gpd.sjoin(overlay, df, op='within', how='right')
    # Sum all wealth and population measures by administrative unit
    grouped = grouped.groupby(numberkey, as_index=False).agg('sum')
    # Create the final population-weighted wealth metric by dividing by the population value
    grouped['rwi'] = grouped['weighted_rwi']/grouped['pop_weight']
    # Remove unneeded fields; rename
    grouped = grouped[[numberkey, 'rwi', 'pop_weight']]\
        .rename({'pop_weight':'pop'}, axis=1)
    # Re-join geometric areas for admin units
    grouped = df[[numberkey, namekey, 'geometry']].merge(grouped, how='left',
                                                         on=numberkey)
    # Identify any admin units which had no associated wealth data
    nulls = grouped[pd.isnull(grouped['rwi'])].copy()
    nonnulls = grouped[~pd.isnull(grouped['rwi'])].copy()
    # Label unassigned admin units with the mean of surrounding units
    imputed = []
    for index, row in nulls.iterrows():
        neighbors = nonnulls[nonnulls.geometry.touches(row['geometry'])]
        imputed.append(neighbors['rwi'].mean())
    nulls['rwi'] = imputed
    # Rejoin assigned and estimated admin units
    grouped = pd.concat([nulls, nonnulls])
    maps[name] = grouped
This will give us the maps object which contains all of our dataframes. To access a single dataframe, you can use the following code with the name of the desired administrative unit layer.
maps['governorates'].head()
ADM1_CODE | ADM1_NAME | geometry | rwi | pop | |
---|---|---|---|---|---|
0 | 1701 | Ajloon | POLYGON ((35.70369 32.21736, 35.69852 32.21098... | 0.571924 | 2.034861e+05 |
1 | 1705 | Amman | POLYGON ((36.57022 31.72390, 36.57620 31.71572... | 0.902020 | 3.107416e+06 |
2 | 1703 | Aqaba | POLYGON ((35.51787 29.27050, 35.48292 29.27587... | 0.530247 | 1.589200e+05 |
3 | 1702 | Balqa | MULTIPOLYGON (((35.69407 31.89742, 35.69169 31... | 0.664370 | 9.657574e+05 |
4 | 1707 | Irbid | POLYGON ((35.75544 32.42284, 35.75291 32.42523... | 0.642397 | 1.467434e+06 |
We can store these as either geographic or text files containing each administrative layer's population-weighted wealth measure. While non-geographic files are easier to view and use in statistical analysis, the geographic files can be used in subsequent geo-analyses and so may also be desirable to store. We'll show examples of storing these as csv files and shapefiles, but for instructions on the many other formats available, see the Pandas documentation and the GeoPandas documentation.
def store_as_file(df, country, admin_lvl_nm, file_type):
    """
    Store population weighted wealth measures for a given admin level
    as either a csv or shp file

    Inputs:
        df (DataFrame): dataframe containing data to store
        country (str): string field of country name
        admin_lvl_nm (str): the name of administrative units at the given
            admin level (eg, 'division', 'district')
        file_type (str): file type to store as, either 'csv' or 'shp'
    """
    file_name = "weighted_wealth_" + country + "_" + admin_lvl_nm
    if file_type == 'csv':
        file_name = file_name + ".csv"
        df.to_csv(file_name)
        print('Saved {}'.format(file_name))
    elif file_type == 'shp':
        file_name = file_name + ".shp"
        file_gpf = gpd.GeoDataFrame(df)
        file_gpf.to_file(file_name)
        print('Saved {}'.format(file_name))
    else:
        print('Unknown file_type requested - select either "csv" or "shp"')

# For each admin level and file type desired, save files
for admin_lvl_nm, df in maps.items():
    for file_type in ['csv','shp']:
        store_as_file(df, 'jordan', admin_lvl_nm, file_type)
Saved weighted_wealth_jordan_governorates.csv
Saved weighted_wealth_jordan_governorates.shp
Saved weighted_wealth_jordan_districts.csv
Saved weighted_wealth_jordan_districts.shp
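If you'd like, you can confirm a saved file loads back correctly before moving on:
# Optional check: read a saved shapefile back in and inspect the first rows
check = gpd.read_file('weighted_wealth_jordan_districts.shp')
check.head()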
Finally, it may also be desirable to view the administrative areas according to their population-weighted wealth measures. We can use the same plotting package, matplotlib, which we used above to create a map for each of our two admin unit levels.
fig, ax = plt.subplots(1,2, figsize=(20,15))
ax = ax.flatten()
nation = jordan_admin.dissolve(by='ADM0_NAME').reset_index()
# Create the base plots of the entire country for the number of admin level
# maps we want to create
for a in range(len(ax)):
    nation.plot(ax=ax[a], color='lightgrey')
    ax[a].axis('off')
# Create each admin level plot
maps['governorates'].plot(ax=ax[0], column='rwi', cmap='magma', legend=True,
legend_kwds={'shrink':0.5, 'label':'Pop-Weighted RWI'})
maps['districts'].plot(ax=ax[1], column='rwi', cmap='magma', legend=True,
legend_kwds={'shrink':0.5, 'label':'Pop-Weighted RWI'})
ax[0].set_title('Population-Weighted RWI by Governorates', fontsize='xx-large')
ax[1].set_title('Population-Weighted RWI by Districts', fontsize='xx-large')
# Save this plot as an image
plt.savefig('jordan_wealth_maps.png', dpi=300)
plt.show()
Even with a cursory inspection, we can see the value in viewing our weighted wealth measures by multiple administrative levels. The darker colors represent lower wealth areas, while the lighter colors represent high wealth areas for Jordan. While at the governorate level, the southeast governorate seems to be one of the most in need, upon viewing the map broken down by district, we can see that there are a range of district wealth levels within the poorer governorates, and that in fact the northeast of the country might deserve the greatest initial consideration. Depending on the use case and scale of decisions which need to be made, these can each provide unique value and insight.
An important final step in any computational analysis is validating the results. This serves to confirm the accuracy of your input data if, as in this case, it is derived from alternative methods. More importantly, it validates your own code and processes. Validation requires some source of ground-truth wealth data for your country or region.
One source of wealth data which exists for multiple countries is The Demographic and Health Surveys (DHS) Program, funded by the US Agency for International Development (USAID). The DHS supports surveys in more than 90 countries and makes the data available for research purposes, though you must register your project and be approved to obtain access. While the DHS RWI values are an excellent, comprehensive source, they were also the wealth values used to train Berkeley and Facebook's Relative Wealth Index, which we use as our source of wealth data above. Thus, validating using DHS will not be an independent confirmation of wealth accuracy, but rather a confirmation that our process stays true to the original RWI values.
While validating our process is helpful, wherever possible it is best to also validate the overall wealth values with a separate source of wealth data. This data may be less available, outdated, or limited in scope (eg, only income or expenditures), but comparing against our population-weighted wealth values can still provide valuable confirmation or indication of concern, depending on how well the values align compared to expectations.
You can check the country's government site or the databases of organizations working in-country for additional sources of survey data. For example, Jordan conducts a Household Expenditures and Income Survey (HIES) which we will also use for validation.
In order to use DHS datasets, you must register for each project and dataset you need access to. It can take up to two business days for your registration to be approved, though often this happens more quickly. When registering, provide clear information about your project and your desired use of the DHS data. In our case, it is to validate aggregated wealth maps created through the use of non-traditional sources. Be sure to read the usage conditions for DHS data thoroughly: two components to note in particular are that you should not reuse data from one project without re-registering, and you should provide a copy of your final project to DHS once completed.
You'll receive an email when you've been granted access. You may then log in to the DHS site, and you'll be prompted to 'select a Project' in a dropdown.
Select the project name you applied for - for this example, it's 'Geo4Dev Learning Modules' - and you'll next be prompted to choose the country whose data you want to use.
After selecting a country, you'll be able to view and select the year of survey data you'd like to use. This should align as closely as possible with the years of the wealth and population data you've incorporated. For this example, we'll take the most recent, 2017-2018.
Finally, you'll download the data. DHS provides its data in multiple formats to make using the data straightforward in Stata, SAS, or SPSS. In Python, we can still easily ingest this data as well, as Pandas provides functionality to read Stata, SAS, and SPSS file types as DataFrames. For this example, we can download the Stata files, which will be provided as a .zip folder. I'll download the 'Household Recode' data, which provides survey results at the level of the household as opposed to results from individual members of the household, or members by gender and age. This should allow us to most directly compare the weighted wealth estimates we created with the DHS data. For an explanation and information on the different DHS dataset types, see here.
To access these files, you'll need to unzip the .zip file by either right-clicking and selecting 'Extract All' (on Windows) or double-clicking (on MacOS). We can then read this data into Python using Pandas' .read_stata() function. Note you'll have to replace the file path used in the example below with the path to the .dta file you downloaded. (For more information on the DHS file naming conventions, see here.)
dhs_jordan_household = pd.read_stata('./JO_2017-18_DHS_08192021_1422_166256/JOHR73DT/JOHR73FL.DTA',convert_categoricals=False)
dhs_jordan_household.head()
hhid | hv000 | hv001 | hv002 | hv003 | hv004 | hv005 | hv006 | hv007 | hv008 | ... | hc73_03 | hc73_04 | hc73_05 | hc73_06 | hc73_07 | hc73_08 | hc73_09 | hc73_10 | hc73_11 | hc73_12 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | 1 1 | JO7 | 1 | 1 | 2 | 1 | 2241802 | 10 | 2017 | 1414 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
1 | 1 2 | JO7 | 1 | 2 | 1 | 1 | 2241802 | 10 | 2017 | 1414 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
2 | 1 3 | JO7 | 1 | 3 | 1 | 1 | 2241802 | 10 | 2017 | 1414 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
3 | 1 4 | JO7 | 1 | 4 | 1 | 1 | 2241802 | 11 | 2017 | 1415 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
4 | 1 5 | JO7 | 1 | 5 | 1 | 1 | 2241802 | 10 | 2017 | 1414 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
5 rows × 2325 columns
We have our dataset, which we can see is very large - depending on your country and survey, the exact size may vary. Some of these columns are not filled in for our survey, so we'll delete those.
dhs_jordan_household = dhs_jordan_household.dropna(axis=1,how='all')
dhs_jordan_household.head()
hhid | hv000 | hv001 | hv002 | hv003 | hv004 | hv005 | hv006 | hv007 | hv008 | ... | hc64_09 | hc68_01 | hc68_02 | hc68_03 | hc68_04 | hc68_05 | hc68_06 | hc68_07 | hc68_08 | hc68_09 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | 1 1 | JO7 | 1 | 1 | 2 | 1 | 2241802 | 10 | 2017 | 1414 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
1 | 1 2 | JO7 | 1 | 2 | 1 | 1 | 2241802 | 10 | 2017 | 1414 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
2 | 1 3 | JO7 | 1 | 3 | 1 | 1 | 2241802 | 10 | 2017 | 1414 | ... | NaN | 4.0 | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
3 | 1 4 | JO7 | 1 | 4 | 1 | 1 | 2241802 | 11 | 2017 | 1415 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
4 | 1 5 | JO7 | 1 | 5 | 1 | 1 | 2241802 | 10 | 2017 | 1414 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
5 rows × 1525 columns
We'll select only the columns of interest to us, but first, let's rename the columns to be more user-friendly. DHS provides code to easily rename in Stata, SAS, and SPSS, but since we're working in Python, we'll need to use a bit of a work-around with the Stata .do file. We'll take the rows of the .do file which are used to 'label variable' and build a mapping table ourselves.
NOTE: I'm selecting only the first 2327 rows of the .do file in this example. After this, the .do script begins to 'label define' the values in each column, so we only want to select the 'label variable' lines. Depending on the survey and country you select, you should examine the .do file first and only select the number of rows which contain 'label variable' commands.
stata_do = pd.read_table('./JO_2017-18_DHS_08192021_1422_166256/JOHR73DT/JOHR73FL.DO',
# labels are in quotes, so initially split to just separate labels
sep='"',
# indicate there are no meaningful column names
header=None,
# add in temporary column names
names=('to_split','label','unnamed'),
# skip the first row (a stata infix command we don't need)
skiprows=1,
# only take the first 2327 rows of the do file - the rest define the possible values for each field
nrows=2327)
stata_do.head()
to_split | label | unnamed | |
---|---|---|---|
0 | label variable hhid | Case Identification | NaN |
1 | label variable hv000 | Country code and phase | NaN |
2 | label variable hv001 | Cluster number | NaN |
3 | label variable hv002 | Household number | NaN |
4 | label variable hv003 | Respondent's line number (answering Household ... | NaN |
Now, we see the 'label' column contains the user-friendly names, while the final term in the 'to_split' column contains the column codes we'd like to replace. We can separate these into their own columns to be able to easily map code to label.
stata_do[['na1','na2','code']] = stata_do['to_split'].str.split(expand=True)
stata_do.head()
to_split | label | unnamed | na1 | na2 | code | |
---|---|---|---|---|---|---|
0 | label variable hhid | Case Identification | NaN | label | variable | hhid |
1 | label variable hv000 | Country code and phase | NaN | label | variable | hv000 |
2 | label variable hv001 | Cluster number | NaN | label | variable | hv001 |
3 | label variable hv002 | Household number | NaN | label | variable | hv002 |
4 | label variable hv003 | Respondent's line number (answering Household ... | NaN | label | variable | hv003 |
We'll now take only the code and label columns and use them to create a Python dictionary. A dictionary is a way to store data in key-value pairs (the codes as the keys mapped to labels as the values), and it will enable us to rename the columns of our DataFrame.
rename_dict = dict(zip(stata_do['code'],stata_do['label']))
dhs_jordan_household = dhs_jordan_household.rename(columns=rename_dict)
dhs_jordan_household.head()
Case Identification | Country code and phase | Cluster number | Household number | Respondent's line number (answering Household questionnaire) | Ultimate area unit | Household sample weight (6 decimals) | Month of interview | Year of interview | Date of interview (CMC) | ... | Birth order number | Mother's highest educational level (for preliminary and final report) | Mother's highest educational level (for preliminary and final report) | Mother's highest educational level (for preliminary and final report) | Mother's highest educational level (for preliminary and final report) | Mother's highest educational level (for preliminary and final report) | Mother's highest educational level (for preliminary and final report) | Mother's highest educational level (for preliminary and final report) | Mother's highest educational level (for preliminary and final report) | Mother's highest educational level (for preliminary and final report) | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | 1 1 | JO7 | 1 | 1 | 2 | 1 | 2241802 | 10 | 2017 | 1414 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
1 | 1 2 | JO7 | 1 | 2 | 1 | 1 | 2241802 | 10 | 2017 | 1414 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
2 | 1 3 | JO7 | 1 | 3 | 1 | 1 | 2241802 | 10 | 2017 | 1414 | ... | NaN | 4.0 | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
3 | 1 4 | JO7 | 1 | 4 | 1 | 1 | 2241802 | 11 | 2017 | 1415 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
4 | 1 5 | JO7 | 1 | 5 | 1 | 1 | 2241802 | 10 | 2017 | 1414 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN |
5 rows × 1525 columns
Excellent, we now have a clearly-named table containing our survey data. We can now select the relevant information to compare with our weighted wealth dataset. From looking at the documentation of this survey, we'll need to use:
"Result of household interview" - to ensure the interview was completed
"Region"
"Wealth index combined"
The 'Wealth index combined' field provides the wealth index quintile which the household falls into. According to The DHS Wealth Index publication report, these quintiles are calculated by creating a weighted frequency distribution that includes every member of every household, so the population is accounted for. Thus, we can use this field to compare against our population-weighted wealth value directly.
# ensure survey was completed
dhs_jordan_household_wealth = dhs_jordan_household[dhs_jordan_household['Result of household interview']==1]
# select only fields of interest for comparing wealth index values
dhs_jordan_household_wealth = dhs_jordan_household_wealth.loc[:,("Region","Wealth index combined")]
dhs_jordan_household_wealth.head()
Region | Region | Wealth index combined | |
---|---|---|---|
0 | 11 | 1 | 4 |
1 | 11 | 1 | 3 |
2 | 11 | 1 | 5 |
3 | 11 | 1 | 5 |
4 | 11 | 1 | 4 |
We can see this is just about what we want. The only issue is that there are two 'Region' fields: from looking at the documentation, one is the Governorate we're familiar with, while the other is an indicator for North, South, or Central. Let's rename these for clarity.
dhs_jordan_household_wealth.columns = ['Governorate_ID','Region','Wealth index combined']
dhs_jordan_household_wealth.head()
Governorate_ID | Region | Wealth index combined | |
---|---|---|---|
0 | 11 | 1 | 4 |
1 | 11 | 1 | 3 |
2 | 11 | 1 | 5 |
3 | 11 | 1 | 5 |
4 | 11 | 1 | 4 |
Now, let's find the mean wealth index for each region. We'll do this using Pandas' .groupby() functionality, which allows us to group by a column of interest (in our case, Governorate_ID) and calculate statistics for each group.
dhs_jordan_household_wealth_gb = dhs_jordan_household_wealth.groupby(by='Governorate_ID').mean().reset_index()
dhs_jordan_household_wealth_gb.head()
Governorate_ID | Region | Wealth index combined | |
---|---|---|---|
0 | 11 | 1.0 | 3.476891 |
1 | 12 | 1.0 | 2.808511 |
2 | 13 | 1.0 | 2.348156 |
3 | 14 | 1.0 | 2.320438 |
4 | 21 | 2.0 | 2.691185 |
We now have our mean wealth index for each Governorate to compare against our weighted wealth index. The final step we'll take is to add friendly names identifying the Governorates. We'll do this using a mapping of Governorate ID to Governorate name, which can be found in the .MAP document downloaded with the DHS data. This mapping is also found at the bottom of the Stata .do file we used above.
name_govs = {11: "Amman", 12: "Balqa", 13: "Zarqa",
             14: "Madaba", 21: "Irbid", 22: "Mafraq", 23: "Jarash",
             # note: spellings must match ADM1_NAME in the FAO GAUL data
             # (e.g. 'Ajloon'), or the merge below will silently drop rows
             24: "Ajloon", 31: "Karak", 32: "Tafiela", 33: "Ma'an",
             34: "Aqaba"}
name_govs_df = pd.DataFrame.from_dict(name_govs,orient='index',columns=['Governorate']).reset_index()
name_govs_df.head()
index | Governorate | |
---|---|---|
0 | 11 | Amman |
1 | 12 | Balqa |
2 | 13 | Zarqa |
3 | 14 | Madaba |
4 | 21 | Irbid |
dhs_jordan_household_wealth_gb = dhs_jordan_household_wealth_gb.merge(name_govs_df,left_on='Governorate_ID',right_on='index')
dhs_jordan_household_wealth_gb
Governorate_ID | Region | Wealth index combined | index | Governorate | |
---|---|---|---|---|---|
0 | 11 | 1.0 | 3.476891 | 11 | Amman |
1 | 12 | 1.0 | 2.808511 | 12 | Balqa |
2 | 13 | 1.0 | 2.348156 | 13 | Zarqa |
3 | 14 | 1.0 | 2.320438 | 14 | Madaba |
4 | 21 | 2.0 | 2.691185 | 21 | Irbid |
5 | 22 | 2.0 | 1.722969 | 22 | Mafraq |
6 | 23 | 2.0 | 2.178521 | 23 | Jarash |
7 | 24 | 2.0 | 2.408532 | 24 | Ajloon |
8 | 31 | 3.0 | 2.690714 | 31 | Karak |
9 | 32 | 3.0 | 2.341991 | 32 | Tafiela |
10 | 33 | 3.0 | 2.058548 | 33 | Ma'an |
11 | 34 | 3.0 | 2.839971 | 34 | Aqaba |
Now let's join this to the weighted wealth indices we created and make a scatterplot of the DHS wealth index against our wealth index at the Governorate level to see how well they align.
validate_dhs = maps['governorates'].merge(dhs_jordan_household_wealth_gb, left_on='ADM1_NAME',right_on='Governorate')
validate_dhs.head()
ADM1_CODE | ADM1_NAME | geometry | rwi | pop | Governorate_ID | Region | Wealth index combined | index | Governorate | |
---|---|---|---|---|---|---|---|---|---|---|
0 | 1705 | Amman | POLYGON ((36.57022 31.72390, 36.57620 31.71572... | 0.902020 | 3.107416e+06 | 11 | 1.0 | 3.476891 | 11 | Amman |
1 | 1703 | Aqaba | POLYGON ((35.51787 29.27050, 35.48292 29.27587... | 0.530247 | 1.589200e+05 | 34 | 3.0 | 2.839971 | 34 | Aqaba |
2 | 1702 | Balqa | MULTIPOLYGON (((35.69407 31.89742, 35.69169 31... | 0.664370 | 9.657574e+05 | 12 | 1.0 | 2.808511 | 12 | Balqa |
3 | 1707 | Irbid | POLYGON ((35.75544 32.42284, 35.75291 32.42523... | 0.642397 | 1.467434e+06 | 21 | 2.0 | 2.691185 | 21 | Irbid |
4 | 1708 | Jarash | POLYGON ((35.68235 32.19351, 35.68264 32.19029... | 0.607955 | 2.499389e+05 | 23 | 2.0 | 2.178521 | 23 | Jarash |
import seaborn as sns
fig, ax1 = plt.subplots(1,1,figsize=(8,8))
# regression line (without a confidence band) plus points colored by Governorate
sns.regplot(x=validate_dhs['Wealth index combined'],y=validate_dhs['rwi'],ci=None,ax=ax1)
sns.scatterplot(x=validate_dhs['Wealth index combined'],y=validate_dhs['rwi'],hue=validate_dhs['ADM1_NAME'],ax=ax1)
ax1.set_title('Comparison of Pop-Weighted RWI against DHS Wealth Index')
ax1.set_xlabel('DHS Wealth Index')
ax1.set_ylabel('Population-Weighted RWI')
plt.show()
We can see that, at the Governorate level, our population-weighted wealth values roughly align with the DHS wealth index, though there are a few outlier Governorates where our estimate falls well below or slightly above the DHS value.
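To put a number on this visual alignment, we can compute a correlation coefficient between the two measures. Below is a minimal check, assuming SciPy is installed alongside the packages we've already used:
from scipy.stats import pearsonr
# quantify the linear association between the DHS index and our weighted RWI
r, p = pearsonr(validate_dhs['Wealth index combined'], validate_dhs['rwi'])
print(f'Pearson correlation: {r:.3f} (p-value: {p:.3f})')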
For a stronger comparison, we can perform this same analysis at the District (Admin Level 2) level. To do this, you'll need to request DHS GPS data, which requires additional justification. This data is provided at the level of clusters, which are groupings of households within a relatively small geographic radius. The cluster of each household was provided in our original dhs_jordan_household dataset above, so once we have the geographic coordinates of each cluster, we can assign each cluster to its appropriate District and find the mean relative wealth index for all associated households.
NOTE: The DHS GPS locations are displaced from their original values by up to 5 km. This is done to protect the anonymity of survey participants, but it means that precise location calculations with this dataset will not be accurate. It works well for our purposes, since the displacement is restricted to within admin level 2 boundaries, but the displacement is important to be aware of before using this data for any other purpose. For more, see the DHS GPS Data Collection page.
Once your request is approved, you can select and download the shapefiles for your country as you did for the non-geocoded DHS data. We'll bring these data into Python with GeoPandas' read_file():
dhs_jordan_geo = gpd.read_file('./JO_2017-18_DHS_08242021_055_166256/JOGE71FL/JOGE71FL.shp')
dhs_jordan_geo.head()
DHSID | DHSCC | DHSYEAR | DHSCLUST | CCFIPS | ADM1FIPS | ADM1FIPSNA | ADM1SALBNA | ADM1SALBCO | ADM1DHS | ... | DHSREGCO | DHSREGNA | SOURCE | URBAN_RURA | LATNUM | LONGNUM | ALT_GPS | ALT_DEM | DATUM | geometry | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | JO201700000001 | JO | 2017.0 | 1.0 | JO | NULL | NULL | NULL | NULL | 11.0 | ... | 11.0 | Amman | GPS | U | 31.980907 | 35.910510 | 9999.0 | 909.0 | WGS84 | POINT (35.91051 31.98091) |
1 | JO201700000002 | JO | 2017.0 | 2.0 | JO | NULL | NULL | NULL | NULL | 11.0 | ... | 11.0 | Amman | GPS | U | 31.975399 | 35.896461 | 9999.0 | 950.0 | WGS84 | POINT (35.89646 31.97540) |
2 | JO201700000003 | JO | 2017.0 | 3.0 | JO | NULL | NULL | NULL | NULL | 11.0 | ... | 11.0 | Amman | GPS | U | 31.957432 | 35.901973 | 9999.0 | 855.0 | WGS84 | POINT (35.90197 31.95743) |
3 | JO201700000004 | JO | 2017.0 | 4.0 | JO | NULL | NULL | NULL | NULL | 11.0 | ... | 11.0 | Amman | GPS | U | 31.973120 | 35.918679 | 9999.0 | 899.0 | WGS84 | POINT (35.91868 31.97312) |
4 | JO201700000005 | JO | 2017.0 | 5.0 | JO | NULL | NULL | NULL | NULL | 11.0 | ... | 11.0 | Amman | GPS | U | 31.956353 | 35.924025 | 9999.0 | 880.0 | WGS84 | POINT (35.92403 31.95635) |
5 rows × 21 columns
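Before trimming this table down, a quick plot of the cluster points over our administrative boundaries is a simple sanity check that the coordinates landed where we expect (this sketch reuses the jordan_admin boundaries from earlier):
# plot cluster locations over the admin boundaries to confirm the coordinates look sensible
fig, ax1 = plt.subplots(1,1,figsize=(8,8))
jordan_admin.plot(ax=ax1, color='lightgrey', edgecolor='white')
dhs_jordan_geo.plot(ax=ax1, color='red', markersize=3)
ax1.axis('off')
ax1.set_title('DHS Cluster Locations')
plt.show()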
We'll only need a few of these fields: the cluster ID (DHSCLUST), to join back to our standard DHS data containing the wealth index, and the geometry, to assign each cluster to a District. We can select just these to make things clearer.
dhs_jordan_geo_simp = dhs_jordan_geo.loc[:,('DHSCLUST','geometry')]
# select cluster number and wealth index from non-geocoded DHS data used in section above
dhs_jor_cluster = dhs_jordan_household.loc[:,('Cluster number','Wealth index combined')].groupby('Cluster number').mean().reset_index()
dhs_jor_cluster
Cluster number | Wealth index combined | |
---|---|---|
0 | 1 | 4.650000 |
1 | 2 | 4.000000 |
2 | 3 | 3.750000 |
3 | 4 | 3.500000 |
4 | 5 | 2.750000 |
... | ... | ... |
965 | 966 | 2.000000 |
966 | 967 | 1.263158 |
967 | 968 | 2.200000 |
968 | 969 | 2.150000 |
969 | 970 | 1.263158 |
970 rows × 2 columns
# join geocoded DHS records with DHS survey values on cluster number
dhs_jordan_geo_wi = dhs_jordan_geo_simp.merge(dhs_jor_cluster,left_on='DHSCLUST',right_on='Cluster number')
dhs_jordan_geo_wi.head()
DHSCLUST | geometry | Cluster number | Wealth index combined | |
---|---|---|---|---|
0 | 1.0 | POINT (35.91051 31.98091) | 1 | 4.65 |
1 | 2.0 | POINT (35.89646 31.97540) | 2 | 4.00 |
2 | 3.0 | POINT (35.90197 31.95743) | 3 | 3.75 |
3 | 4.0 | POINT (35.91868 31.97312) | 4 | 3.50 |
4 | 5.0 | POINT (35.92403 31.95635) | 5 | 2.75 |
Now, let's join each of these clusters to our Admin Level 2 data to assign each cluster a District. We can then take the mean wealth index within each District to arrive at a value we can compare against our population-weighted wealth.
district_dhs = gpd.sjoin(dhs_jordan_geo_wi, jordan_admin.loc[:,('ADM2_NAME','geometry')], op='within', how='right')
# summarize dataset by admin area, taking the mean wealth index for each
district_dhs_gb = district_dhs.groupby('ADM2_NAME').mean().reset_index()
# view the first 5 rows
district_dhs_gb.head()
ADM2_NAME | index_left | DHSCLUST | Cluster number | Wealth index combined | |
---|---|---|---|---|---|
0 | Ail | 863.428571 | 864.428571 | 864.428571 | 1.342982 |
1 | Ajloon | 642.963636 | 643.963636 | 643.963636 | 2.449250 |
2 | Al-Aghwar Al-Janoobiya | 746.444444 | 747.444444 | 747.444444 | 1.994444 |
3 | Al-Aghwar Al-Shimaliya | 407.500000 | 408.500000 | 408.500000 | 2.397198 |
4 | Al-Ardha | NaN | NaN | NaN | NaN |
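Notice that some districts, such as Al-Ardha above, contain no DHS clusters: because we used how='right' in the spatial join, every district is kept whether or not a cluster falls inside it, leaving NaN where there is nothing to average. Since these rows carry no survey information, we can optionally drop them before comparing:
# drop districts containing no surveyed clusters
district_dhs_gb = district_dhs_gb.dropna(subset=['Wealth index combined'])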
district_dhs_val = maps['districts'].merge(district_dhs_gb,on='ADM2_NAME')
district_dhs_val.head()
ADM2_CODE | ADM2_NAME | geometry | rwi | pop | index_left | DHSCLUST | Cluster number | Wealth index combined | |
---|---|---|---|---|---|---|---|---|---|
0 | 65716 | Ajloon | POLYGON ((35.59864 32.30641, 35.59948 32.29984... | 0.557053 | 160044.507860 | 642.963636 | 643.963636 | 643.963636 | 2.449250 |
1 | 65718 | Wadi Araba | POLYGON ((35.03999 29.78441, 35.04312 29.78150... | 0.254556 | 7426.015194 | 956.500000 | 957.500000 | 957.500000 | 1.387500 |
2 | 65722 | Al-Salt | POLYGON ((35.59573 31.98709, 35.60333 31.99011... | 0.640925 | 124581.522892 | 131.631579 | 132.631579 | 132.631579 | 3.448840 |
3 | 65740 | Irbid | POLYGON ((35.70837 32.61929, 35.71080 32.61822... | 0.811595 | 581782.593036 | 383.400000 | 384.400000 | 384.400000 | 2.947373 |
4 | 65724 | Al-Qaser | POLYGON ((35.69533 31.29930, 35.69598 31.29446... | 0.439920 | 30620.383179 | 737.500000 | 738.500000 | 738.500000 | 2.725058 |
# seaborn was already imported above
fig, ax1 = plt.subplots(1,1,figsize=(8,8))
sns.regplot(x=district_dhs_val['Wealth index combined'],y=district_dhs_val['rwi'],ci=None,ax=ax1)
ax1.set_title('Comparison of Pop-Weighted RWI against DHS Wealth Index')
ax1.set_xlabel('DHS Wealth Index')
ax1.set_ylabel('Population-Weighted RWI')
plt.show()
As a final visual comparison, we can look at maps of our population-weighted wealth and the DHS relative wealth index to see how well their trends align.
fig, ax = plt.subplots(1,2, figsize=(12, 6))
ax = ax.flatten()
nation = jordan_admin.dissolve(by='ADM0_NAME').reset_index()
# Draw a base map of the entire country on each panel
for a in range(len(ax)):
    nation.plot(ax=ax[a], color='lightgrey')
    ax[a].axis('off')
# Plot each wealth measure by District
district_dhs_val.plot(ax=ax[0], column='rwi', cmap='magma', legend=True,
                      legend_kwds={'shrink':0.5, 'label':'Pop-Weighted RWI'})
district_dhs_val.plot(ax=ax[1], column='Wealth index combined', cmap='magma', legend=True,
                      legend_kwds={'shrink':0.5, 'label':'DHS Wealth Index'})
ax[0].set_title('Population-Weighted RWI by District', fontsize='xx-large')
ax[1].set_title('DHS Wealth Index by District', fontsize='xx-large')
plt.show()
While the scales are different, both maps assign relative wealth across districts in a very similar pattern.
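Because the two measures sit on different scales, a scale-invariant statistic such as Spearman's rank correlation is a useful way to quantify that similarity. A quick check, again assuming SciPy is available:
from scipy.stats import spearmanr
# rank correlation ignores the differing scales of the two indices;
# nan_policy='omit' skips any districts without DHS clusters
rho, p = spearmanr(district_dhs_val['Wealth index combined'],
                   district_dhs_val['rwi'], nan_policy='omit')
print(f'Spearman rank correlation: {rho:.3f} (p-value: {p:.3g})')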
For another source of validation data, we'll use the Jordanian Household Expenditures and Income Survey (HIES). The HIES is available only at the Governorate level, so we will use our Governorate estimates for comparison. Jordan's Department of Statistics provides multiple datasets describing households, expenditures, and income, with the most recent years available at the time of writing being 2017-2018. While the measures of income and expenditure we'll obtain from this survey are not entirely representative of wealth as calculated in our Relative Wealth Index, they are closely related, so they should give us a sense of whether our values match expectations or whether something has gone wrong.
We'll use both Average of Annual Current Household Income by Source of Income and Governorate and Urban Rural (Table 3.3) and Average of Annual Household Expenditure on Groups of Commodities and Services by Governorate (Table 4.6). These are available as PDFs, so we'll copy the data into Python and create a DataFrame of average income and average expenditure by Governorate.
hies_2018 = pd.DataFrame({
    'governorate': ['Jarash','Mafraq','Irbid','Madaba','Zarqa','Balqa',
                    'Amman','Aqaba',"Ma'an",'Tafiela','Karak','Ajlun'],
    'expenditures': [9815.6,9470.2,11589.4,11387.1,11641.5,10232.6,
                     14054.3,9447.8,10155.6,8631.6,10787.8,10771.0],
    'income': [9077.6,9138.7,10432.0,10413.9,9562.6,11450.9,
               12657.2,10303.3,9575.9,10133.2,11755.3,10050.6]})
hies_2018
governorate | expenditures | income | |
---|---|---|---|
0 | Jarash | 9815.6 | 9077.6 |
1 | Mafraq | 9470.2 | 9138.7 |
2 | Irbid | 11589.4 | 10432.0 |
3 | Madaba | 11387.1 | 10413.9 |
4 | Zarqa | 11641.5 | 9562.6 |
5 | Balqa | 10232.6 | 11450.9 |
6 | Amman | 14054.3 | 12657.2 |
7 | Aqaba | 9447.8 | 10303.3 |
8 | Ma'an | 10155.6 | 9575.9 |
9 | Tafiela | 8631.6 | 10133.2 |
10 | Karak | 10787.8 | 11755.3 |
11 | Ajlun | 10771.0 | 10050.6 |
Now, we can join this HIES average income and expenditure data to our estimates of population-weighted wealth to compare values. However, due to differences in how Governorate names are transliterated from Arabic to English, we'll need to adjust one of the datasets so the spellings match in both. To see which names differ, we can take another look at the Governorates dataset we generated:
maps['governorates']['ADM1_NAME']
0      Ajloon
1       Amman
2       Aqaba
3       Balqa
4       Irbid
5      Jarash
6       Karak
7       Ma'an
8      Madaba
9      Mafraq
10    Tafiela
11      Zarqa
Name: ADM1_NAME, dtype: object
We'll adjust the HIES dataset to match the administrative area spellings used in our dataset.
# copy the governorate names into a new 'ADM1_NAME' field to match our boundary data
hies_2018['ADM1_NAME'] = hies_2018['governorate']
# rename 'Ajlun' to 'Ajloon' to match the spelling in our boundaries
hies_2018['ADM1_NAME'] = np.where(hies_2018['governorate']=='Ajlun',
                                  'Ajloon', hies_2018['ADM1_NAME'])
hies_2018
governorate | expenditures | income | ADM1_NAME | |
---|---|---|---|---|
0 | Jarash | 9815.6 | 9077.6 | Jarash |
1 | Mafraq | 9470.2 | 9138.7 | Mafraq |
2 | Irbid | 11589.4 | 10432.0 | Irbid |
3 | Madaba | 11387.1 | 10413.9 | Madaba |
4 | Zarqa | 11641.5 | 9562.6 | Zarqa |
5 | Balqa | 10232.6 | 11450.9 | Balqa |
6 | Amman | 14054.3 | 12657.2 | Amman |
7 | Aqaba | 9447.8 | 10303.3 | Aqaba |
8 | Ma'an | 10155.6 | 9575.9 | Ma'an |
9 | Tafiela | 8631.6 | 10133.2 | Tafiela |
10 | Karak | 10787.8 | 11755.3 | Karak |
11 | Ajlun | 10771.0 | 10050.6 | Ajloon |
Now, we can join these datasets by governorate name:
validate_hies = maps['governorates'].merge(hies_2018, on='ADM1_NAME')
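Because an inner merge silently drops any rows whose names fail to match, it's worth confirming that all twelve Governorates survived the join before plotting. A quick sanity check:
# any HIES governorate names that failed to match our boundaries appear here
unmatched = set(hies_2018['ADM1_NAME']) - set(maps['governorates']['ADM1_NAME'])
print(f'{len(validate_hies)} of {len(hies_2018)} governorates matched')
print('Unmatched names:', unmatched if unmatched else 'none')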
Finally, we can create scatterplots to visualize the relationship between our population-weighted wealth index values and the HIES survey data. We should expect them to display similar trends if we've accurately created our population-weighted values. Note, though, that since the expenditure and income data are in Jordanian Dinars while our relative wealth index is a unitless relative measure, the scales of our plots will differ.
fig, (ax1,ax2) = plt.subplots(1,2,figsize=(12,6))
sns.regplot(x=validate_hies['income'],y=validate_hies['rwi'],ci=None,ax=ax1)
sns.scatterplot(x=validate_hies['income'],y=validate_hies['rwi'],hue=validate_hies['ADM1_NAME'],ax=ax1)
ax1.set_title('Comparison of Pop-Weighted RWI against HIES Income')
ax1.set_xlabel('HIES Average Income')
ax1.set_ylabel('Population-Weighted RWI')
sns.regplot(x=validate_hies['expenditures'],y=validate_hies['rwi'],ci=None,ax=ax2)
sns.scatterplot(x=validate_hies['expenditures'],y=validate_hies['rwi'],hue=validate_hies['ADM1_NAME'],ax=ax2)
ax2.set_title('Comparison of Pop-Weighted RWI against HIES Expenditure')
ax2.set_xlabel('HIES Average Expenditure')
ax2.set_ylabel('Population-Weighted RWI')
plt.show()
From these plots, we can see that the weighted RWI corresponds better to the expenditure values than to the income values, though neither is tightly aligned. Given that we've had to roll our data up to the Governorate level, and that income and expenditure capture only part of what the more complex RWI measures (which draws on satellite imagery, internet connectivity, topography, and cellular data, among other sources), a lack of exact alignment is not unexpected. This demonstrates the importance of validating against multiple sources where possible, as each validation needs to be interpreted within its own context.
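To put numbers behind this comparison, we can correlate the weighted RWI with each HIES measure directly, reusing the validate_hies data from above:
# compare how strongly the weighted RWI tracks each HIES measure
for col in ('income', 'expenditures'):
    r = validate_hies['rwi'].corr(validate_hies[col])
    print(f'Correlation of rwi with {col}: {r:.3f}')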
The increasing availability of novel datasets with global coverage presents enormous opportunities for evidence-based policymaking where ground-truth data were previously unavailable. By combining estimates built from these geographic datasets, such as the population and wealth measures considered above, we can further enhance their accessibility and usefulness for the organizations and individuals working to improve outcomes for these populations.