## WC_DF Initialisation

import pandas  ## This is the module for creating and manipulating DataFrames

# Load the world-cities CSV (expected in the working directory) into the
# global DataFrame WC_DF, which the rest of the cells work from.
WC_DF = pandas.read_csv("worldcities.csv")


top_5_cities = WC_DF["city"][:5]   ## selects the first 5 items of the "city" column.
top_5_cities


# Relabel the five entries of the Series with the letters 'a'..'e'.
top_5_cities.index = list("abcde")
top_5_cities


# The index (row labels) of the Series.
top_5_cities.index


# The underlying array of values for the first 5 entries of "city", without the index.
WC_DF["city"][:5].values


# The column labels of the DataFrame (a pandas Index object).
WC_DF.columns


# The same column labels as a plain Python list.
list(WC_DF.columns)


# Select a single row by integer position (position 1 is the second row).
WC_DF.iloc[1]


# iterrows() yields (index label, row) pairs; stop once the label exceeds 3.
# NOTE(review): this prints 5 rows only if the index is the default 0, 1, 2, ... — confirm.
for i, row in WC_DF.iterrows():
    print(i, row['city_ascii'], row['lat'], row['lng'])
    if i >3: break


WC_DF.sort_values(by=["country"], ascending=True)[:10] # First 10 rows after sorting by the "country" column, ascending


filtered_DF = WC_DF[ WC_DF['capital'] == 'admin'] # Keeps only rows whose 'capital' value is 'admin' (administrative capitals)
filtered_DF.head()


# Question 1a answer cell

def non_ascii_cities():
    """Placeholder answer function; not implemented yet, so it returns None.

    Once completed it is meant to return a set of all non-ascii city names
    in the world_cities data.
    """
    # TODO: replace this placeholder return with the real implementation.
    return None


# Question 1b answer cell

def num_cities_occurring_n_times(n):
    """Placeholder answer function; not implemented yet, so it returns None.

    Once completed it is meant to return a value according to the question's
    specification (not shown here).
    NOTE(review): presumably the number of city names that occur exactly
    ``n`` times in the data; confirm against the specification.
    """
    # TODO: replace this placeholder return with the real implementation.
    return None


def country_num_cities_dict():
    """Placeholder answer function; not implemented yet, so it returns None.

    NOTE(review): presumably meant to return a dict mapping each country to
    its number of cities; confirm against the question specification.
    """
    # TODO: replace this placeholder return with the real implementation.
    return None


# Question 1d answer cell

def largest_cities_dataframe(n):
    """Placeholder answer function; not implemented yet, so it returns None.

    Once completed it is meant to return the n cities with the largest
    population.
    NOTE(review): the original template comment says "a list", while the
    function name suggests a DataFrame; confirm the required return type
    against the question specification.
    """
    # TODO: replace this placeholder return with the real implementation.
    return None


# Complete question 1d in this cell

def big_cities_in_country(country, population):
    """Placeholder answer function; not implemented yet, so it returns None.

    ``country`` is a string argument. Once completed the function is meant
    to return a list, as set out in the question specification (not shown
    here).
    NOTE(review): presumably the cities of ``country`` whose population
    reaches ``population``; confirm against the specification.
    """
    # TODO: replace this placeholder return with the real implementation.
    return None


## Question 1e Answer Code Cell

def country_total_cities_population(country):
    """Placeholder answer function; not implemented yet, so it returns None.

    NOTE(review): presumably meant to return the combined population of the
    listed cities of ``country``; confirm against the question specification.
    """
    # TODO: replace this placeholder return with the real implementation.
    return None


# Q2a answer code cell

import pandas    ## This is the module for creating and manipulating DataFrames

# The url of the quake datasource (the all_day.csv summary feed hosted on
# earthquake.usgs.gov) is assigned to the global variable 'QUAKE_SOURCE'
# for your convenience.
QUAKE_SOURCE = ( "http://earthquake.usgs.gov/" +
                 "earthquakes/feed/v1.0/summary/all_day.csv" )


QUAKE_DF = None  ## Modify this line to import the data using Pandas


## If QUAKE_DF is a DataFrame, show the first 5 rows
try:
    # isinstance (rather than an exact type comparison) also accepts
    # DataFrame subclasses.
    if isinstance(QUAKE_DF, pandas.DataFrame):
        display(QUAKE_DF.head())
    else:
        print("QUAKE_DF is not a DataFrame")
except NameError:
    # Raised when the name QUAKE_DF does not exist at all (e.g. the assignment
    # cell was never run). Note it is also raised if `display` is unavailable,
    # i.e. when running outside IPython/Jupyter.
    print("QUAKE_DF has not been assigned a value")


def show_deep_quakes( depth ):
    """Report the quakes in QUAKE_DF whose "depth" value is at least `depth`.

    Prints how many such quakes there are, then displays them sorted from
    the largest depth value to the smallest. Reads the global QUAKE_DF and
    returns nothing.
    """
    ## Boolean mask: True for every row whose depth value is >= the threshold
    is_deep_enough = QUAKE_DF["depth"] >= depth
    deep_quakes = QUAKE_DF[is_deep_enough]   ## Select rows by the condition

    ## The first entry of the shape is the number of rows
    how_many = deep_quakes.shape[0]
    print("Number of quakes of depth {} or deeper:".format(depth), how_many)

    ## Deepest first
    deepest_first = deep_quakes.sort_values("depth", ascending=False)
    display(deepest_first)


## Quick checks that QUAKE_DF has been loaded and has a "depth" column.
## `except Exception` keeps these best-effort (any ordinary failure just
## prints the hint) while no longer swallowing KeyboardInterrupt/SystemExit
## as a bare `except:` would.

## Show all quakes with a depth value of 100 or more
try:
    show_deep_quakes(100)
except Exception:
    print("Probably QUAKE_DF not correctly set")


## Largest value in the "depth" column
try:
    QUAKE_DF["depth"].max()
except Exception:
    print("Probably QUAKE_DF not correctly set")


## Smallest value in the "depth" column
try:
    QUAKE_DF["depth"].min()
except Exception:
    print("Probably QUAKE_DF not correctly set")


# Complete question 2b answer cell

def powerful_quakes(mag):
    """Placeholder answer function: currently ignores `mag` and returns an
    empty DataFrame.

    Once completed it is meant to return a DataFrame with all quakes of
    magnitude greater than or equal to `mag`.
    """
    ## TODO: replace the empty DataFrame with the real selection of quakes
    no_quakes = pandas.DataFrame()
    return no_quakes


# Question 2c answer cell

def most_powerful_n_quakes(n):
    """Placeholder answer function; not implemented yet, so it returns None.

    Once completed it is meant to return a DataFrame of the 'top n' quakes
    of the all_day.csv file.
    """
    # TODO: replace this placeholder return with the real implementation.
    return None


## Function to compute distance between locations (kilometres) 
# Returns the surface distance in kilometres, according to the Haversine formula,
# between two locations given as (latitude, longitude) coordinate pairs.

import math
def haversine_distance( loc1 , loc2 ):
    '''Return the surface distance in kilometres between two locations.

    Uses the Haversine formula on a sphere of radius 6371 km.

    loc1, loc2 -- (latitude, longitude) pairs, in degrees.

    The result is in kilometres because the radius used is in kilometres.
    '''
    lat1, lon1 = loc1
    lat2, lon2 = loc2
    radius = 6371  # Earth radius in kilometres
    dlat = math.radians(lat2 - lat1)
    dlon = math.radians(lon2 - lon1)
    sin_half_dlat = math.sin(dlat / 2)
    sin_half_dlon = math.sin(dlon / 2)
    a = (sin_half_dlat * sin_half_dlat +
         math.cos(math.radians(lat1)) * math.cos(math.radians(lat2)) *
         sin_half_dlon * sin_half_dlon)
    # For (nearly) antipodal points floating-point rounding can push `a` a
    # hair above 1, which would make sqrt(1 - a) fail with a domain error.
    a = min(1.0, a)
    c = 2 * math.atan2(math.sqrt(a), math.sqrt(1 - a))
    return radius * c


## 2d Answer Code Cell

def quake_distance_from_loc_dataframe(loc):
    """Placeholder answer function; not implemented yet, so it returns None.

    Once completed it is meant to return a DataFrame in accord with the
    question specification (not shown here).
    NOTE(review): presumably the quakes together with their distance from
    `loc`; confirm against the specification.
    """
    ## TODO: replace this placeholder return with the real implementation.
    return None


def effective_magnitude( magnitude, depth, surface_distance ):
    """Estimate the magnitude felt at `surface_distance` from a quake's epicenter.

    The logarithmic magnitude is converted to a linear energy value, reduced
    by the inverse square of the straight-line distance to the source, and
    converted back to a log base 10 scale. Surface curvature and damping
    effects are ignored.
    """
    ## Crude fix for small or negative depths (can occur where land is above
    ## sea level): never use a depth below 1.
    depth = max(depth, 1)

    ## Linear energy corresponding to the logarithmic magnitude
    source_energy = 10**magnitude

    ## Squared distance to the source by Pythagoras (flat-surface approximation)
    separation_squared = surface_distance**2 + depth**2

    ## Inverse-square attenuation, then back to a log base 10 scale
    return math.log10(source_energy / separation_squared)

# Some test cases.
#effective_magnitude(9,100,500)
#effective_magnitude(6,50, 100)

# Some test cases.
#effective_magnitude(9,100,500)
#effective_magnitude(6,50, 100)


def epicenter_magnitude( magnitude, depth ):
    """Return the effective magnitude directly above the source, i.e. at a
    surface distance of 0."""
    at_epicenter = 0
    return effective_magnitude( magnitude, depth, at_epicenter )


## 2e Answer Code Cell
def endangered_cities(min_population, min_effective_magnitude):
    """Placeholder answer function; not implemented yet, so it returns None.

    Once completed it must fulfil the question specification (not shown
    here).
    NOTE(review): presumably selects cities with at least `min_population`
    that experience an effective magnitude of at least
    `min_effective_magnitude`; confirm against the specification.
    """
    ## TODO: replace this placeholder return with the real implementation.
    return None


from ipyleaflet import Map, basemaps, basemap_to_tiles, Circle, Polyline
from ipywidgets import Layout

# Location of Leeds. NOTE(review): the pair is ordered (latitude, longitude),
# matching how quake locations are passed to draw_circle_on_map elsewhere in
# this file — not (longitude, latitude).
LEEDS_LOC  = ( 53.8008,  -1.5491  ) # (latitude, longitude) of Leeds
WORLD_MAP = Map(basemap=basemaps.OpenTopoMap, center=LEEDS_LOC, zoom=1.5,
                layout=Layout(height="500px")) # Here we create a map object centred on Leeds

# As the last expression of a notebook cell this renders the map widget.
WORLD_MAP


def draw_circle_on_map( a_map, location, radius = 1000, color="red", fill_color=None ):
    """Add a circle layer to `a_map` at `location`.

    `radius` and `color` set the circle's size and outline colour. When no
    `fill_color` is given (or it is empty), the outline colour is used for
    the fill as well.
    """
    marker = Circle(
        location=location,
        radius=radius,
        color=color,
        fill_color=fill_color or color,   # fall back to the outline colour
    )
    a_map.add_layer(marker)

# Mark Leeds on WORLD_MAP with a green circle (default radius of 1000).
# This will edit your previous map rather than produce a new one
draw_circle_on_map(WORLD_MAP, LEEDS_LOC, color="green" ) 

def display_powerful_quakes_on_map(mag):
    """Draw a circle on WORLD_MAP for each quake returned by powerful_quakes(mag).

    Each circle is centred on the quake's ("latitude", "longitude") and its
    radius is 20000 times the quake's "mag" value truncated to an integer.
    """
    # Use the caller's threshold (this was previously hard-coded to 3, so the
    # `mag` argument had no effect).
    powerful = powerful_quakes(mag)
    for _, quake in powerful.iterrows():
        draw_circle_on_map( WORLD_MAP,
                            (quake["latitude"], quake["longitude"]),
                            radius=20000 * int(quake["mag"]) )

# Add circles to WORLD_MAP for the powerful quakes, passing a magnitude threshold of 3.
display_powerful_quakes_on_map(3)

city	country	status
Pisa	Italy	ENDANGERED
Rome	Italy	SAFE
Milan	Italy	SAFE

Assignment 2¶

Data and Algorithms:¶

Cities and Earthquakes¶

an exercise in geographic data analysis¶

Last Modified: 5th October 2021 (BB)¶

Question 1: World Cities¶

Coding Techniques for Working with DataFrames¶

Loading data from a CSV file into a DataFrame¶

Getting the Data for this Question¶

Checking the contents of a DataFrame¶

Accessing DataFrame columns and rows¶

Iterating through the rows of a DataFrame¶

Sorting the rows of a DataFrame¶

Note on encodings of the city name¶

Filtering DataFrames¶

Overview of Question 1 tasks¶

Question 1a¶

Question 1b¶

Question 1c¶

Question 1d¶

Question 1e¶

Question 1f¶

Question 2: Earthquakes - Web Access and Pandas DataFrames¶

Question 2a: Read in data file¶

You can use the following cell to test if you have read the quake data into QUAKE_DF¶

Note:¶

More examples of useful pandas functions¶

Question 2b: Find Powerful Quakes¶

Question 2c: Find n+ most powerful earthquakes¶

Note:¶

Distance between locations on the Earth's surface¶

Question 2d: Sort quakes by distance from a given location¶

Note:¶

Question 2e: Identifying Endangered Cities¶

Effect of an earthquake at a distance from its epicenter¶

Specification of the endangered_cities function¶

Example Output:¶

Notes:¶

Optional Exercises¶

Constructing a city risk status alert DataFrame¶

Visualisation Exercise: display endangered cities on a map¶

More Ideas for Graphical Display¶

Coding Techniques for Working with `DataFrame`s¶

Loading data from a CSV file into a `DataFrame`¶

You can use the following cell to test if you have read the quake data into `QUAKE_DF`¶

More examples of useful `pandas` functions¶

Question 2c: Find `n+` most powerful earthquakes¶

Specification of the `endangered_cities` function¶

Constructing a city risk status alert `DataFrame`¶