from datascience import *
import numpy as np

%matplotlib inline
import matplotlib.pyplot as plots
plots.style.use('fivethirtyeight')


# Load the movie data set from a CSV file into a Table and display it.
top_movies = Table.read_table('top_movies_2017.csv')
top_movies


# Age of each movie in years, measured from 2023, stored as a new 'Age' column.
ages = 2023 - top_movies.column('Year')
top_movies = top_movies.with_column('Age', ages)


# Bin edges (in years of age); note that the bins have unequal widths.
my_bins = make_array(0, 5, 10, 15, 25, 40, 65, 105)


# Count the movies whose 'Age' falls in each bin. The result has a 'bin'
# column and an 'Age count' column.
binned_data = top_movies.bin('Age', bins = my_bins)
binned_data


# Total number of movies across all bins.
num_movies = sum(binned_data.column('Age count'))
num_movies

200


# Express each bin's count as a percentage of all movies and attach it as a
# 'Percent' column.
percents = binned_data.column('Age count')/num_movies * 100
binned_data = binned_data.with_column('Percent', percents)


binned_data


# Draw the histogram of ages using the same unequal-width bins.
top_movies.hist('Age', bins = my_bins, unit = 'Year')


# Question: What is the height of the [40, 65) bin?
# The cells below compute it as (percent in the bin) / (width of the bin).

# Percent of movies in the bin whose lower edge is 40.
percent = binned_data.where('bin', 40).column('Percent').item(0)


# Width of the bin, in years.
width = 65 - 40


# Height of the bar, in percent per year.
height = percent / width
height

1.14


def triple(x):
    """Return three times ``x``.

    ``x`` may be any value that supports multiplication by an integer,
    for example a number, a string, or an array.
    """
    tripled = 3 * x
    return tripled


# Call triple with a literal argument.
triple(3)

9


# The argument can also be a name bound to a value ...
num = 4


triple(num)

12


# ... or a larger expression, whose value (here 20) is what gets tripled.
triple(num * 5)

60

def functionname(Arguments_Parameters_Expressions_or_Values):
    """Template showing the general shape of a function definition.

    The names used here are placeholders: the parameter list goes between
    the parentheses, and the expression after ``return`` is the value the
    function produces. ``return_expression`` is not defined, so this
    template is not meant to be called.
    """
    return return_expression


# With a string argument, the string is repeated three times.
triple('ha')

'hahaha'


np.arange(4)

array([0, 1, 2, 3])


# With an array argument, every element is tripled.
triple(np.arange(4))

array([0, 3, 6, 9])

def f(s):
    """Return each entry of ``s`` as a percentage of the sum of ``s``.

    The percentages are rounded to two decimal places.
    """
    total = sum(s)
    shares = s / total * 100
    return np.round(shares, 2)


def percent_of_total(s):
    """Convert the entries of ``s`` to percentages of their total.

    Each entry is divided by the sum of all entries, scaled to a
    percentage, and rounded to two decimal places.
    """
    fractions = s / sum(s)
    return np.round(fractions * 100, 2)


first_four=make_array(1,2,3,4)
first_four

array([1, 2, 3, 4])


# The entries sum to 10, so they are 10%, 20%, 30% and 40% of the total.
percent_of_total(first_four)

array([ 10.,  20.,  30.,  40.])


# The percentages are rounded to two decimal places.
percent_of_total(make_array(1, 213, 38))

array([  0.4 ,  84.52,  15.08])


def hypotenuse(x, y):
    """Return the hypotenuse of a right triangle with legs ``x`` and ``y``.

    Computed as the square root of ``x`` squared plus ``y`` squared.
    """
    x_squared = x ** 2
    y_squared = y ** 2
    return (x_squared + y_squared) ** 0.5


# Legs 1 and 2: the square root of 5.
hypotenuse(1, 2)

2.23606797749979


# The 3-4-5 right triangle.
hypotenuse(3, 4)

5.0


def hypotenuse(x, y):
    """Return the square root of ``x`` squared plus ``y`` squared."""
    return pow(x ** 2 + y ** 2, 0.5)


# Legs 9 and 12: the 3-4-5 triangle scaled by 3.
hypotenuse(9, 12)

15.0


def age(year, current_year=2023):
    """Return the age in years of someone born in ``year``.

    Args:
        year: The year of birth.
        current_year: The year the age is measured in. Defaults to 2023,
            so existing single-argument calls keep their results.

    Returns:
        ``current_year - year``.
    """
    return current_year - year


# Age of someone born in 1942.
age(1942)

81


def name_and_age(name, year):
    """Return a sentence stating the age of ``name``, born in ``year``.

    The age is obtained by calling ``age(year)``.
    """
    years_old = age(year)
    return name + ' is ' + str(years_old) + ' years old.'


# Build the sentence for a person named Joe who was born in 1942.
name_and_age('Joe', 1942)

'Joe is 81 years old.'


# A small table of people and their birth years.
staff = Table().with_columns(
    'Person', make_array('Jim', 'Pam', 'Michael', 'Creed'),
    'Birth Year', make_array(1985, 1988, 1967, 1904)
)
staff


# Call age on every value in the 'Birth Year' column; the results come back
# as an array with one entry per row.
staff.apply(age, 'Birth Year')

array([ 38,  35,  56, 119])


# The same array built by hand, calling age on one row's value at a time.
make_array(age(staff.column('Birth Year').item(0)),
           age(staff.column('Birth Year').item(1)),
           age(staff.column('Birth Year').item(2)),
           age(staff.column('Birth Year').item(3)))

array([ 38,  35,  56, 119])


# With two column labels, each row's 'Person' and 'Birth Year' values are
# passed as the two arguments of name_and_age.
staff.apply(name_and_age, 'Person', 'Birth Year')

array(['Jim is 38 years old.', 'Pam is 35 years old.',
       'Michael is 56 years old.', 'Creed is 119 years old.'],
      dtype='<U24')

Title	Studio	Gross	Gross (Adjusted)	Year
Gone with the Wind	MGM	198676459	1796176700	1939
Star Wars	Fox	460998007	1583483200	1977
The Sound of Music	Fox	158671368	1266072700	1965
E.T.: The Extra-Terrestrial	Universal	435110554	1261085000	1982
Titanic	Paramount	658672302	1204368000	1997
The Ten Commandments	Paramount	65500000	1164590000	1956
Jaws	Universal	260000000	1138620700	1975
Doctor Zhivago	MGM	111721910	1103564200	1965
The Exorcist	Warner Brothers	232906145	983226600	1973
Snow White and the Seven Dwarves	Disney	184925486	969010000	1937

Lecture 9: Functions

Histogram Review

Defining Functions

The Anatomy of a Function

Functions are Type-Agnostic

Discussion Question

Functions Can Take Multiple Arguments

Example: A function that takes the year of birth of a person and produces their age in years.

Apply

bin	Age count
0	0
5	21
10	17
15	41
25	43
40	57
65	21
105	0

bin	Age count	Percent
0	0	0
5	21	10.5
10	17	8.5
15	41	20.5
25	43	21.5
40	57	28.5
65	21	10.5
105	0	0

Person	Birth Year
Jim	1985
Pam	1988
Michael	1967
Creed	1904