We begin by importing some helper functions.
# NOTE(review): wildcard import. The helpers called further down
# (data_from_url, fetch_year, barplot, print_pretty_table) are not defined in
# the visible part of this file and presumably come from `helper`; confirm,
# and consider importing them by name.
from helper import *
# Address of the Wikipedia article that is handed to data_from_url() below.
url = 'https://en.wikipedia.org/wiki/List_of_helicopter_prison_escapes'
Now, let's get the data from the List of helicopter prison escapes Wikipedia article.
# Fetch the article's table through the helper. Judging by how `data` is used
# below (index assignment, row slicing, row[0] rewritten in place) it is a
# mutable list of row lists; TODO confirm against helper.data_from_url.
data = data_from_url(url)
Let's print the first four fields of every row.
# Show only the leading four fields of each row in the dataset.
for record in data:
    leading_fields = record[:4]
    print(leading_fields)
[1971, 'Santa Martha Acatitla', 'Mexico', 'Yes'] [1973, 'Mountjoy Jail', 'Ireland', 'Yes'] [1978, 'United States Penitentiary, Marion', 'United States', 'No'] [1981, 'Fleury-Mérogis, Essonne, Ile de France', 'France', 'Yes'] [1981, 'Orsainville Prison, Quebec City', 'Canada', 'No'] [1983, 'Pentridge (HM Prison)', 'Australia', 'No'] [1985, 'Perry Correctional Institution, Pelzer, South Carolina', 'United States', 'Yes'] [1985, 'Cândido Mendes penitentiary, Ilha Grande, Rio de Janeiro', 'Brazil', 'Yes'] [1986, 'Prison de la Santé', 'France', 'Yes'] [1986, 'Federal Correctional Institution, Dublin', 'United States', 'Yes'] [1986, 'Prigione di Rebibbia, Roma', 'Italy', 'Yes'] [1987, 'Gartree (HM Prison)', 'United Kingdom', 'Yes'] [1988, 'Santa Fe prison', 'United States', 'Yes'] [1989, 'Federal Holding Facility, Miami, FL', 'United States', 'No'] [1989, 'Arkansas Valley Correctional Facility', 'United States', 'Yes'] [1990, 'Kent Penitentiary, British Columbia', 'Canada', 'Yes'] [1991, 'Rio Piedras State Penitentiary, Puerto Rico', 'Puerto Rico', 'Yes'] [1992, 'Lyon Prison', 'France', 'Yes'] [1992, 'Touraine Central Prison, Tours', 'France', 'No'] [1993, 'Touraine Central Prison, Tours', 'France', 'No'] [1996, 'High Security Prison, Santiago', 'Chile', 'Yes'] [1997, 'De Geerhorst jail', 'Netherlands', 'No'] [1999, 'Metropolitan Remand and Reception Centre', 'Australia', 'Yes'] [2000, 'Martin Treatment Center for Sexually Violent Predators, Martin County Florida', 'United States', 'Yes'] [2000, 'Lyon prison', 'France', 'Yes'] [2001, 'Luynes prison', 'France', 'Yes'] [2001, 'Draguignan prison', 'France', 'Yes'] [2001, 'Fresnes prison', 'France', 'No'] [2002, 'Parada Neto Penitentiary', 'Brazil', 'Yes'] [2002, 'Las Cucharas prison, Puerto Rico', 'United States', 'Yes'] [2003, 'Luynes prison', 'France', 'Yes'] [2005, 'France', 'France', 'No'] [2005, 'Aiton Prison', 'France', 'Yes'] [2006, 'Korydallos Prison', 'Greece', 'Yes'] [2007, 'Lantin Prison, Liège', 'Belgium', 
'Yes'] [2007, 'Grasse prison', 'France', 'Yes'] [2007, 'Ittre prison', 'Belgium', 'No'] [2009, 'Korydallos Prison', 'Greece', 'Yes'] [2009, 'Domenjod Prison, Réunion', 'France', 'Yes'] [2009, 'Bruges', 'Belgium', 'Yes'] [2010, 'HM Prison Isle of Wight, Isle of Wight', 'United Kingdom', 'No'] [2012, 'Sheksna, Penal colony N17', 'Russia', 'Yes'] [2013, 'Trikala Prison, Trikala', 'Greece', 'No'] [2013, 'Saint-Jérôme Detention Facility, Quebec', 'Canada', 'Yes'] [2014, 'Orsainville Detention Facility, Quebec', 'Canada', 'Yes'] [2016, 'Thiva', 'Greece', 'No'] [2018, 'Réau, near Paris', 'France', 'Yes'] [2020, 'Forest prison, Brussels', 'Belgium', 'No']
# Remove the trailing column from every row, storing the shortened copy back
# into the same slot of `data`.
# NOTE(review): running this block twice strips one more column each time.
for position, entry in enumerate(data):
    data[position] = entry[:-1]

# Preview the first three shortened rows.
print(data[:3])
[['August 19, 1971', 'Santa Martha Acatitla', 'Mexico', 'Yes', 'Joel David Kaplan Carlos Antonio Contreras Castro'], ['October 31, 1973', 'Mountjoy Jail', 'Ireland', 'Yes', "JB O'Hagan Seamus TwomeyKevin Mallon"], ['May 24, 1978', 'United States Penitentiary, Marion', 'United States', 'No', 'Garrett Brock TrapnellMartin Joseph McNallyJames Kenneth Johnson']]
# Try fetch_year on one sample date string and print what it returns.
date = "July 23, 2009"
year = fetch_year(date)
print(year)
2009
# Overwrite the first field of every row with whatever fetch_year returns for
# it. The rows are mutated in place, so `data` itself is not rebound.
for record in data:
    first_field = record[0]
    record[0] = fetch_year(first_field)

# Preview the first two converted rows.
print(data[:2])
[[1971, 'Santa Martha Acatitla', 'Mexico', 'Yes', 'Joel David Kaplan Carlos Antonio Contreras Castro'], [1973, 'Mountjoy Jail', 'Ireland', 'Yes', "JB O'Hagan Seamus TwomeyKevin Mallon"]]
# Smallest and largest value found in the first column of the data.
min_year = min(record[0] for record in data)
max_year = max(record[0] for record in data)

# Every year from min_year through max_year, both ends included, so years
# that have no row in the data are still listed.
years = list(range(min_year, max_year + 1))
print(years)
[1971, 1972, 1973, 1974, 1975, 1976, 1977, 1978, 1979, 1980, 1981, 1982, 1983, 1984, 1985, 1986, 1987, 1988, 1989, 1990, 1991, 1992, 1993, 1994, 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013, 2014, 2015, 2016, 2017, 2018, 2019, 2020]
from collections import Counter

# Tally how many rows carry each first-column value in a single pass over the
# data, instead of rescanning every row once per year.
attempts_by_year = Counter(row[0] for row in data)

# Build one [year, count] pair per entry of `years`, in the same order.
# A year with no matching row gets 0, because Counter returns 0 for a key it
# has never seen (and does not insert it).
attempts_per_year = [[y, attempts_by_year[y]] for y in years]
print(attempts_per_year)
[[1971, 1], [1972, 0], [1973, 1], [1974, 0], [1975, 0], [1976, 0], [1977, 0], [1978, 1], [1979, 0], [1980, 0], [1981, 2], [1982, 0], [1983, 1], [1984, 0], [1985, 2], [1986, 3], [1987, 1], [1988, 1], [1989, 2], [1990, 1], [1991, 1], [1992, 2], [1993, 1], [1994, 0], [1995, 0], [1996, 1], [1997, 1], [1998, 0], [1999, 1], [2000, 2], [2001, 3], [2002, 2], [2003, 1], [2004, 0], [2005, 2], [2006, 1], [2007, 3], [2008, 0], [2009, 3], [2010, 1], [2011, 0], [2012, 1], [2013, 2], [2014, 1], [2015, 0], [2016, 1], [2017, 0], [2018, 1], [2019, 0], [2020, 1]]
# IPython magic (not plain Python): only valid when run inside IPython/Jupyter.
# It selects the inline matplotlib backend so figures render below the cell.
%matplotlib inline
# Hand the [year, count] pairs to the plotting helper.
# NOTE(review): barplot is not defined in the visible source; presumably it
# draws one bar per year. Confirm against helper.
barplot(attempts_per_year)
The years 1986, 2001, 2007, and 2009 saw the most helicopter prison escape attempts, with three each.
# Count how often each value occurs in the "Country" column.
# NOTE(review): `df` is not defined anywhere in the visible source; presumably
# it is a pandas DataFrame exposed by `from helper import *`. Confirm where it
# comes from, and whether it reflects the same rows as `data`.
countries_frequency = df["Country"].value_counts()
# Render the counts as a table through the helper.
print_pretty_table(countries_frequency)
Country | Number of Occurrences |
---|---|
France | 15 |
United States | 8 |
Greece | 4 |
Belgium | 4 |
Canada | 4 |
Australia | 2 |
United Kingdom | 2 |
Brazil | 2 |
Italy | 1 |
Netherlands | 1 |
Russia | 1 |
Puerto Rico | 1 |
Ireland | 1 |
Chile | 1 |
Mexico | 1 |