Predicting Overwatch League Rankings with statistics¶

Leo Fafoutis¶

Introduction¶

Overwatch 1 was a 6v6 first-person shooter developed by Blizzard Entertainment and released in 2016. The game pits two teams against each other as they try to capture objectives or complete map-specific tasks. The three roles in the game (tank, damage, and support) offer a variety of playstyles.

A competitive scene grew over the years, and a professional league, the Overwatch League (OWL), began play in 2018. There are now 20 teams competing in a regular season that ends with a playoff bracket.

In this tutorial, we want to create a way to rank individual players based on their statistics for each role. These rankings will be based on ideas commonly associated with each role as well as statistics common across all games. We can then use this “Player Impact Rating” to predict the outcome of the playoffs and compare it to the actual results. Our motivation for this experiment is to see how well general statistics can predict a team’s placement. To get a better idea of what a Player Impact Rating could be, note that the Overwatch League’s analysts attempted to create their own Player Impact Rating (PIR) to rank player performance across roles (Read More). In short, it uses a variety of factors to compare players across roles and decide which player, by the numbers, is the best. For the purposes of this tutorial, we will compare players within their respective roles, since we may want to weight healing more heavily for support players or eliminations more heavily for damage players.

However, in order to create this PIR, we need a way to decide which statistics should matter most in our algorithm. To figure out which stats are important, we can use efficiency metrics as well as the statistics commonly associated with each role. Along the way, we will also learn how to read data from a CSV, extract the statistics we need, and analyze them to better understand the data science pipeline.

Data Collection¶

To begin, we will be using Python along with pandas, numpy, matplotlib, seaborn, and scikit-learn to handle the data. First, we need to import the correct libraries into our file as shown below.

In [1]:
# Libraries required for this tutorial
import pandas as pd
import numpy as np
from sklearn.linear_model import LinearRegression
from sklearn.preprocessing import PolynomialFeatures
import matplotlib.pyplot as plt
import seaborn as sns
import warnings
warnings.filterwarnings('ignore')

After we have imported the correct libraries, we need to get the data from the OWL 2019 playoffs. Fortunately, the OWL stats team provides all data from each season here. We can download the 2019 data and extract it into the same folder as our code. In order to read the data, we will take advantage of Pandas .read_csv() function. We use read_csv because it offers a quick, simple way to view data as a dataframe.

In [2]:
playoffs = pd.read_csv("phs_2019_playoffs.csv")
playoffs.head()
Out[2]:
start_time match_id stage map_type map_name player team stat_name hero stat_amount
0 8/31/2019 1:09 30172 Overwatch League 2019 Post-Season CONTROL Ilios Elsa Chengdu Hunters All Damage Done All Heroes 19059.670270
1 8/31/2019 1:09 30172 Overwatch League 2019 Post-Season CONTROL Ilios Elsa Chengdu Hunters Assists All Heroes 22.000000
2 8/31/2019 1:09 30172 Overwatch League 2019 Post-Season CONTROL Ilios Elsa Chengdu Hunters Average Time Alive All Heroes 302.704223
3 8/31/2019 1:09 30172 Overwatch League 2019 Post-Season CONTROL Ilios Elsa Chengdu Hunters Barrier Damage Done All Heroes 8861.540116
4 8/31/2019 1:09 30172 Overwatch League 2019 Post-Season CONTROL Ilios Elsa Chengdu Hunters Damage - Quick Melee All Heroes 152.999995

The dataset should contain over 100,000 rows with the following columns:

  • Start_time → date and time of match played
  • Match_id → numerical id of the match
  • Stage → Current stage of the OWL season (in this case playoffs)
  • Map_type → OW has various map types: Control, Assault, Escort, and Hybrid
  • Map_name → Name of current map
  • Player → Player’s in game name
  • Team → Team of current player (12 teams for the playoffs)
  • Stat_name → Name of stat being calculated
  • Hero → Name of the hero the current player is on
  • Stat_amount → numerical value of the stat_name column
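To confirm the row count and see how many distinct statistics the file records, a quick check such as the following can help (a minimal sketch using only the dataframe we just loaded):

In [ ]:
# How many rows does the raw file contain, and how many distinct stats and teams are recorded?
print(playoffs.shape)
print(playoffs['stat_name'].nunique(), 'distinct stat names')
print(playoffs['team'].nunique(), 'teams')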

Data Management¶

Now that we have our data, we need to tidy it up so it is easier to use later on. Currently, there are rows and columns we do not need for the purposes of this tutorial. To begin, we will remove the columns that do not affect a player's impact: start_time and stage (all of this data comes from the same stage). To do this, we use Pandas' .drop() function. Using .drop() lets us keep working with the same dataframe while removing specific rows or columns in the fewest lines.

In [3]:
playoffs = playoffs.drop(['start_time', 'stage'], axis=1)

We also need to remove rows that would double-count data. The ‘hero’ column contains a row for each individual hero a player used, plus an aggregate ‘All Heroes’ row that sums them. We do not need the ‘All Heroes’ rows, since they duplicate the per-hero values and carry no role-specific information, which is what we need. To remove them, we can set the dataframe equal to a filtered copy of itself that excludes 'All Heroes'. Using .drop() would also work here, but the boolean-filtering approach is worth knowing as another option.

In [4]:
playoffs = playoffs[playoffs.hero != 'All Heroes']
playoffs.head()
Out[4]:
match_id map_type map_name player team stat_name hero stat_amount
28 30172 CONTROL Ilios Elsa Chengdu Hunters All Damage Done D.Va 13934.906430
29 30172 CONTROL Ilios Elsa Chengdu Hunters Assists D.Va 15.000000
30 30172 CONTROL Ilios Elsa Chengdu Hunters Average Time Alive D.Va 569.509017
31 30172 CONTROL Ilios Elsa Chengdu Hunters Barrier Damage Done D.Va 6703.071256
32 30172 CONTROL Ilios Elsa Chengdu Hunters Critical Hit Accuracy D.Va 0.092603

Now that we have removed unnecessary data, we need to add some new information derived from what remains. First, we need a column that identifies which role each hero belongs to so we can classify players later on. To do this, we first create a list for each role containing all of the heroes that can be played in it.

In [5]:
tank = ['Reinhardt', 'Sigma', 'D.Va', 'Wrecking Ball', 'Orisa', 'Winston', 'Zarya', 'Roadhog']
support = ['Ana', 'Baptiste', 'Brigitte', 'Lúcio', 'Mercy', 'Moira', 'Zen']
damage = ['Ashe', 'Bastion', 'McCree', 'Genji', 'Hanzo', 'Junkrat', 'Mei', 'Pharah', 'Reaper', 
          'Soldier 76', 'Sombra', 'Symmetra', 'Torbjorn', 'Tracer', 'Widowmaker', 'Doomfist']

Then, we can write a function that goes through each row and categorizes it based on its hero value. Pandas' .apply() function lets us run a function on every row and create a new column from whatever the lambda expression returns. There are other ways to derive a column like this, but .apply() offers a quick and straightforward solution.

In [6]:
# Go through each row and label tank, support, or damage if hero exists in the role array
def label_role (row):
    if row['hero'] in tank:
        return 'tank'
    if row['hero'] in support:
        return 'support'
    if row['hero'] in damage:
        return 'damage'
    return 'error'

playoffs['role'] = playoffs.apply(lambda row: label_role(row), axis=1)
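Since label_role falls back to 'error' for any hero name that does not exactly match one of the three lists, a quick sanity check can catch spelling mismatches between our lists and the CSV's 'hero' column (for example, abbreviations or accented names). A minimal check:

In [ ]:
# Any hero that did not match one of the role lists will show up here (ideally an empty array)
print(playoffs.loc[playoffs['role'] == 'error', 'hero'].unique())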
In [7]:
playoffs.head()
Out[7]:
match_id map_type map_name player team stat_name hero stat_amount role
28 30172 CONTROL Ilios Elsa Chengdu Hunters All Damage Done D.Va 13934.906430 tank
29 30172 CONTROL Ilios Elsa Chengdu Hunters Assists D.Va 15.000000 tank
30 30172 CONTROL Ilios Elsa Chengdu Hunters Average Time Alive D.Va 569.509017 tank
31 30172 CONTROL Ilios Elsa Chengdu Hunters Barrier Damage Done D.Va 6703.071256 tank
32 30172 CONTROL Ilios Elsa Chengdu Hunters Critical Hit Accuracy D.Va 0.092603 tank

Now, the way the stats are laid out in the CSV is a bit awkward to work with: every statistic lives in the same stat_name/stat_amount pair of columns (a “long” format) rather than each having its own column. To make the data easier to work with, we will extract the relevant values for each player and build a new table. To begin, let's create a set of unique player names we can iterate through to get each player’s individual stats. Rather than building this list by hand, Pandas' .unique() function quickly returns all unique names within a dataframe column.

In [8]:
players = playoffs.player.unique()
players
Out[8]:
array(['Elsa', 'JinMu', 'Kyo', 'YangXiaoLong', 'Yveltal', 'ameng',
       'Chara', 'Eileen', 'HOTBA', 'Rio', 'nero', 'shu', 'Happy',
       'Boombox', 'Poko', 'SADO', 'carpe', 'eqo', 'neptuNo', 'CoMa',
       'Envy', 'Gamsu', 'IZaYaKI', 'YOUNGJIN', 'diem', 'DDing', 'Bdosin',
       'Birdring', 'Fury', 'Gesture', 'Profit', 'QuaterMain', 'Fits',
       'Fleta', 'Marve1', 'Michelle', 'ryujehong', 'tobi', 'Haksal',
       'JJANU', 'SLIME', 'SeoMinSoo', 'TiZi', 'Twilight', 'BEBE', 'Bazzi',
       'GodsB', 'Guxue', 'Ria', 'iDK', 'BigG00se', 'Hydration', 'Shaz',
       'Surefour', 'Void', 'rOar', 'Adora', 'Decay', 'Guard', 'Anamo',
       'Fl0w3R', 'JJonak', 'Mano', 'MekO', 'SAEBYEOLBE', 'Libero',
       'Dogman', 'Erster', 'Gator', 'Masaa', 'Pokpo', 'babybay',
       'Choihyobin', 'STRIKER', 'Viol2t', 'moth', 'sinatraa', 'smurf',
       'Rascal', 'NUS', 'Architect', 'Nevix', 'super'], dtype=object)

Now that we have a set of names to iterate through, we need to extract all of the data relevant to rating the players. To do this, we will iterate through the dataframe with a for loop and save the sum of each player's values as one record in a list. This lets us store the data quickly and makes it easy to build another dataframe later.

However, there is a problem at this step. I mentioned we need to extract relevant data for future use, but since we have not analyzed any data or created the PIR yet, it is difficult to know exactly what is relevant. Fortunately, we can decide on the specific statistics later and gather a general assortment in the meantime, ignoring low-signal statistics like 'shots fired' that do not contribute to any accepted performance metric.

Using Pandas' .loc indexer, we can use our player list to select each player's rows. We then append a record containing each player's name, role, team, time played, eliminations, final blows, assists, deaths, all damage done, hero damage done, damage blocked, damage taken, and healing done.

In [9]:
append_player = [] # List of per-player records we will build up

# Go through each player, gather all instances of each stat, sum them, and store one record per player
for p in players:
    x = playoffs.loc[playoffs['player'] == p]
    role = x['role']
    team = x['team']
    
    tp = x.loc[x['stat_name'] == 'Time Played']
    time_played = tp['stat_amount'].sum()
    
    dt = x.loc[x['stat_name'] == 'Deaths']
    deaths = dt['stat_amount'].sum()
    
    elim = x.loc[x['stat_name'] == 'Eliminations']
    eliminations = elim['stat_amount'].sum()
    
    fb = x.loc[x['stat_name'] == 'Final Blows']
    final_blows = fb['stat_amount'].sum()
    
    assi = x.loc[x['stat_name'] == 'Assists']
    assists = assi['stat_amount'].sum()
    
    alldd = x.loc[x['stat_name'] == 'All Damage Done']
    all_damage_done = alldd['stat_amount'].sum()
    
    db = x.loc[x['stat_name'] == 'Damage Blocked']
    damage_blocked = db['stat_amount'].sum()
    
    dt = x.loc[x['stat_name'] == 'Damage Taken']
    damage_taken = dt['stat_amount'].sum()
    
    herodd = x.loc[x['stat_name'] == 'Hero Damage Done']
    hero_damage_done = herodd['stat_amount'].sum()
    
    he = x.loc[x['stat_name'] == 'Healing Done']
    healing_done = he['stat_amount'].sum()
    
    append_player.append([p, role.iloc[0], team.iloc[0], time_played, eliminations, final_blows, assists, deaths, 
                          all_damage_done, hero_damage_done, damage_blocked, damage_taken, healing_done])

Once we have our array of data, we can use Pandas .DataFrame() function to create a dataframe with columns and rows from our previously made array.

In [10]:
# Creating new dataframe using the record list from before, now naming columns based on the data
player_stats = pd.DataFrame(append_player, columns = ['player', 'role', 'team', 'time_played', 'eliminations', 'final_blows', 
                                                      'assists', 'deaths', 'all_damage_done', 'hero_damage_done', 'damage_blocked', 'damage_taken', 'healing_done'])
player_stats.head()
Out[10]:
player role team time_played eliminations final_blows assists deaths all_damage_done hero_damage_done damage_blocked damage_taken healing_done
0 Elsa tank Chengdu Hunters 3498.163487 90.0 35.0 54.0 35.0 78813.946835 35643.738028 71868.736370 58973.418665 0.000000
1 JinMu damage Chengdu Hunters 3498.163487 95.0 60.0 34.0 50.0 89472.716591 43849.816894 0.000000 30350.028669 0.000000
2 Kyo support Chengdu Hunters 3498.163487 98.0 24.0 74.0 31.0 38001.950358 26834.042363 0.000000 22157.011539 64119.250791
3 YangXiaoLong damage Chengdu Hunters 3498.163487 82.0 24.0 58.0 50.0 78420.876844 32839.213115 9014.902748 27648.442155 0.000000
4 Yveltal support Chengdu Hunters 3498.163487 33.0 12.0 20.0 35.0 13237.696258 7500.577831 0.000000 19125.635731 49803.365637
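For reference, the same per-player totals could also be built without an explicit loop by pivoting the long-format data, although the loop above makes each step easier to follow. A sketch under the same column names (note that the pivoted columns keep the original stat names such as 'Time Played' rather than our snake_case names):

In [ ]:
# Alternative: pivot the long-format stats into one column per stat, summed per player
wanted = ['Time Played', 'Eliminations', 'Final Blows', 'Assists', 'Deaths',
          'All Damage Done', 'Hero Damage Done', 'Damage Blocked', 'Damage Taken', 'Healing Done']
subset = playoffs[playoffs['stat_name'].isin(wanted)]
wide = subset.pivot_table(index='player', columns='stat_name',
                          values='stat_amount', aggfunc='sum', fill_value=0)
# Re-attach each player's role and team (taking the first value seen, as the loop does)
meta = playoffs.groupby('player')[['role', 'team']].first()
alt_stats = meta.join(wide).reset_index()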

Now that we have clearly separated and managed data, we can begin data analysis… almost. One problem is that our data currently shows totals for each category. This means players who made it deeper into the bracket would be rated higher simply because they had more chances to accumulate eliminations and assists. To avoid this issue, the Overwatch League (and Overwatch in general) uses stats measured per 10 minutes of play. Sadly, that per-10-minute data is not publicly available for OWL, but using the data we have, we can apply a function across all rows to convert the values into per-10-minute rates.

To do this, we can use the .apply function again, going through each row and applying a function that computes the stat per 10 minutes. The formula is:

stat(per 10 minutes) = (600 seconds * stat value) / (total time played in seconds)

We also want to drop any player with under 20 minutes of play time. This is a common filter in OWL statistics, since a player who appears for only one map can post unrealistically inflated numbers.

In [11]:
# Store each column we want to calculate a per 10 mins value on
columns = ['eliminations', 'final_blows', 'assists', 'deaths', 'all_damage_done', 'hero_damage_done', 'damage_blocked', 'damage_taken', 'healing_done']

for c in columns:
    
    # Time is stored in seconds, use 600 seconds as 10 mins. Return the per 10 mins value
    def per_ten (row):
        return ((600 * row[c]) / row['time_played'])

    # Change existing row to be of units per 10 mins
    player_stats[c] = player_stats.apply(lambda row: per_ten(row), axis=1)
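As an aside, the same conversion can be done without a Python-level loop by operating on whole columns at once. A vectorized sketch that is equivalent to the loop above (run it instead of the loop, not in addition, or the stats would be scaled twice):

In [ ]:
# Vectorized alternative: scale every stat column to a per-10-minute rate in one step
per_ten_cols = ['eliminations', 'final_blows', 'assists', 'deaths', 'all_damage_done',
                'hero_damage_done', 'damage_blocked', 'damage_taken', 'healing_done']
player_stats[per_ten_cols] = (player_stats[per_ten_cols]
                              .mul(600)
                              .div(player_stats['time_played'], axis=0))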
In [12]:
player_stats.head()
Out[12]:
player role team time_played eliminations final_blows assists deaths all_damage_done hero_damage_done damage_blocked damage_taken healing_done
0 Elsa tank Chengdu Hunters 3498.163487 15.436671 6.003150 9.262003 6.003150 13518.055480 6113.562986 12326.822911 10115.036455 0.000000
1 JinMu damage Chengdu Hunters 3498.163487 16.294264 10.291114 5.831631 8.575929 15346.232430 7521.057901 0.000000 5205.593526 0.000000
2 Kyo support Chengdu Hunters 3498.163487 16.808820 4.116446 12.692374 5.317076 6518.040194 4602.536581 0.000000 3800.338941 10997.642224
3 YangXiaoLong damage Chengdu Hunters 3498.163487 14.064523 4.116446 9.948077 8.575929 13450.636678 5632.534883 1546.223231 4742.221269 0.000000
4 Yveltal support Chengdu Hunters 3498.163487 5.660113 2.058223 3.430371 6.003150 2270.510736 1286.488386 0.000000 3280.401697 8542.202070
In [13]:
# Time stored in seconds, use 1200 seconds to remove all players with less than 20 minutes of playtime
player_stats = player_stats[player_stats['time_played'] >= 1200]
player_stats
Out[13]:
player role team time_played eliminations final_blows assists deaths all_damage_done hero_damage_done damage_blocked damage_taken healing_done
0 Elsa tank Chengdu Hunters 3498.163487 15.436671 6.003150 9.262003 6.003150 13518.055480 6113.562986 12326.822911 10115.036455 0.000000
1 JinMu damage Chengdu Hunters 3498.163487 16.294264 10.291114 5.831631 8.575929 15346.232430 7521.057901 0.000000 5205.593526 0.000000
2 Kyo support Chengdu Hunters 3498.163487 16.808820 4.116446 12.692374 5.317076 6518.040194 4602.536581 0.000000 3800.338941 10997.642224
3 YangXiaoLong damage Chengdu Hunters 3498.163487 14.064523 4.116446 9.948077 8.575929 13450.636678 5632.534883 1546.223231 4742.221269 0.000000
4 Yveltal support Chengdu Hunters 3498.163487 5.660113 2.058223 3.430371 6.003150 2270.510736 1286.488386 0.000000 3280.401697 8542.202070
... ... ... ... ... ... ... ... ... ... ... ... ... ...
76 sinatraa damage San Francisco Shock 17413.605518 23.223220 11.232596 11.990624 6.305414 13480.414974 8509.802416 154.843549 7222.756482 2.238924
77 smurf tank San Francisco Shock 22202.566157 21.997457 4.675135 17.295298 5.918235 15793.131129 5812.403495 20423.271692 9838.326945 0.000000
78 Rascal damage San Francisco Shock 6211.166533 24.053453 8.404218 15.552634 5.409612 17039.293828 8715.729860 4856.452063 5541.179793 0.000000
79 NUS support London Spitfire 3393.073868 7.073232 1.591477 5.304924 5.481755 4515.641492 1565.947588 0.000000 3173.376017 8560.525761
80 Architect damage San Francisco Shock 6186.786785 22.984468 12.122609 10.861858 4.655082 32841.269373 8755.993527 0.000000 6937.621188 0.000000

80 rows × 13 columns

Finally, let's create one last set of dataframes that divides players by role. We will create three new dataframes, each containing only the rows whose role is ‘tank’, ‘damage’, or ‘support’.

In [14]:
# Separate players into three individual dataframes based on the role value
tank_df = player_stats[player_stats['role'] == 'tank']
damage_df = player_stats[player_stats['role'] == 'damage']
support_df = player_stats[player_stats['role'] == 'support']

tank_df.head()
Out[14]:
player role team time_played eliminations final_blows assists deaths all_damage_done hero_damage_done damage_blocked damage_taken healing_done
0 Elsa tank Chengdu Hunters 3498.163487 15.436671 6.003150 9.262003 6.003150 13518.055480 6113.562986 12326.822911 10115.036455 0.0
5 ameng tank Chengdu Hunters 3498.163487 12.520856 1.372149 10.977188 8.232891 11551.170264 4740.750125 13979.642293 10826.026007 0.0
8 HOTBA tank Guangzhou Charge 8551.738904 20.416900 6.524989 13.821750 4.700798 18664.522404 10178.403621 15039.548751 8212.293321 0.0
9 Rio tank Guangzhou Charge 8551.738904 15.996747 3.016930 12.979816 5.823377 13930.162221 4611.205186 22859.774330 8461.234009 0.0
14 Poko tank Philadelphia Fusion 6457.880113 18.117400 6.132043 11.985357 4.273848 17116.883495 7250.029507 18319.923811 7227.170814 0.0

Data Analysis¶

Here we begin our analysis. This phase will include topics such as graphing data, analyzing performance metrics, and understanding which stats we need to focus on for making our role specific PIR. To understand the 2019 rankings, click here.

There is one more thing to understand about the statistics before we begin. Overwatch uses stat names in unusual ways; for example, an elimination can actually be an assist or a final blow. A great YouTube video on this topic is HERE. I would highly recommend watching at least the first part of that video before moving forward to understand more about how Overwatch counts eliminations.

For each of our roles, we want to find a set of 5 statistics we can use for our PIR. This will allow for a standardized PIR across roles to compare later. We also want at least two of those statistics to be role specific, to better rate players. These are arbitrary choices, but it is important that we decide on the template now so the ratings are comparable later on.

Before we get into the role specific breakdown of analyzing what stats are best for each role, let's make a color palette so graphing becomes easier later on. Seaborn has a useful tool named xkcd_palette which allows you to make your own set of colors. Since our damage_df is the largest at 32, we can make a set of 32 colors to use for each role dataframe.
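Since the palette size needs to cover the largest role group, it can be worth quickly confirming how many players ended up in each role after our playtime filter (a minimal check using the dataframe we already built):

In [ ]:
# How many players are in each role after filtering?
print(player_stats['role'].value_counts())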

In [15]:
colors = ["purple", "green", "blue", "pink", "brown", "red", "light blue", "teal", "orange", "light green", "magenta", "yellow", "grey", "dark green", "dark blue", 
          "tan", "cyan", "bright green", "lilac", "hot pink", "olive green", "mustard", "periwinkle", "light pink", "plum", "brick red", "dark brown", "chartreuse", 
          "dark orange", "slate", "sea blue", "twilight blue"]
new_palette = sns.xkcd_palette(colors)

Tanks¶

Starting with tanks, we can begin by plotting Eliminations vs Deaths. In most video games, this is a common way players view stats and is a good starting point for each of our roles. Using seaborn’s lmplot feature, we can plot the data fairly easily. For this graph, being near the bottom right would be the best scenario for a player (high eliminations, low deaths):

In [16]:
# Graph each player's elimination to death value in a scatter plot. Each player will get their own color hue.
sns.lmplot(x="eliminations", y="deaths", data=tank_df, fit_reg=False, legend=False, hue='player', palette=new_palette, size=5, aspect=1.5, scatter_kws={"s": 75})
plt.legend(loc=9, bbox_to_anchor=(0.5, -0.2), ncol=5)

#Use meaningful titles
plt.title('Eliminations vs. Deaths for Tank Players')
plt.xlabel('Eliminations / 10 mins')
plt.ylabel('Deaths / 10 mins')
Out[16]:
Text(20.800000000000004, 0.5, 'Deaths / 10 mins')

One player that stands out is ameng (top left), who dies very often while contributing to almost no eliminations. On the other end of the spectrum, Choihyobin has the highest eliminations while maintaining a relatively low death rate. There seems to be a slight tendency for lower deaths to go with higher eliminations, but the relationship is weak.

Since K/D (eliminations to deaths) is a generic stat independent of role, let's begin analyzing the role-specific information we might need. When thinking of tanks in Overwatch (or any video game), being “tanky” is an important trait: soaking up damage, receiving healing, and taking space are key parts of the tank role. But how do you quantify a player’s ‘tankiness’?

Let's look at a few statistics we have access to, mainly damage_taken and deaths. In theory, if we know the average health pool of the heroes a player uses and the total damage they take per 10 minutes, we can estimate how many times that damage should have killed them. We can call this value ‘expected deaths’ and calculate it by dividing the damage taken by the average hero health (we use 425 HP here as a rough average for the tank hero pool). For example, a tank taking about 10,000 damage per 10 minutes would have roughly 10,000 / 425 ≈ 23.5 expected deaths. We can then plot the expected deaths against the actual deaths:

In [17]:
# Make new column for tank_df that takes all damage taken over average hero health
tank_df['expected_deaths'] = tank_df.apply(lambda row: (row['damage_taken'] / (425)), axis=1)
tank_df.head()
Out[17]:
player role team time_played eliminations final_blows assists deaths all_damage_done hero_damage_done damage_blocked damage_taken healing_done expected_deaths
0 Elsa tank Chengdu Hunters 3498.163487 15.436671 6.003150 9.262003 6.003150 13518.055480 6113.562986 12326.822911 10115.036455 0.0 23.800086
5 ameng tank Chengdu Hunters 3498.163487 12.520856 1.372149 10.977188 8.232891 11551.170264 4740.750125 13979.642293 10826.026007 0.0 25.473002
8 HOTBA tank Guangzhou Charge 8551.738904 20.416900 6.524989 13.821750 4.700798 18664.522404 10178.403621 15039.548751 8212.293321 0.0 19.323043
9 Rio tank Guangzhou Charge 8551.738904 15.996747 3.016930 12.979816 5.823377 13930.162221 4611.205186 22859.774330 8461.234009 0.0 19.908786
14 Poko tank Philadelphia Fusion 6457.880113 18.117400 6.132043 11.985357 4.273848 17116.883495 7250.029507 18319.923811 7227.170814 0.0 17.005108
In [18]:
# Graph each player's deaths to expected death value in a scatter plot
sns.lmplot(x="deaths", y="expected_deaths", data=tank_df, fit_reg=False, legend=False, hue='player', palette=new_palette, size=6, aspect=1, scatter_kws={"s": 75})
plt.legend(loc=9, bbox_to_anchor=(0.5, -0.2), ncol=5)

#Use meaningful titles
plt.title('Actual Deaths vs. Expected Deaths for Tank Players')
plt.xlabel('actual deaths / 10 mins')
plt.ylabel('expected deaths / 10 mins')
Out[18]:
Text(24.956250000000004, 0.5, 'expected deaths / 10 mins')

At a glance, the meaning of a player's position on this graph can be a bit confusing. To simplify it, consider the four corners of the chart: top left, top right, bottom left, and bottom right. Below is a key giving the general meaning of a player's position:

  • Close to Top Left → Takes a lot of Damage, Difficult to Eliminate
  • Close to Top Right → Takes a lot of Damage, Easy to Eliminate
  • Close to Bottom Left → Does not take a lot of Damage, Hard to Eliminate
  • Close to Bottom Right → Does not take a lot of Damage, Easy to Eliminate

If we want to quantify this value as a number, we can create a new column in our dataframe named “tankiness”. This will be the ratio of expected deaths divided by actual deaths, where a higher number is better.

In [19]:
# New column where the value is the ratio of expected deaths:actual deaths
tank_df['tankiness'] = tank_df.apply(lambda row: (row['expected_deaths'] / row['deaths']), axis=1)
tank_df.head()
Out[19]:
player role team time_played eliminations final_blows assists deaths all_damage_done hero_damage_done damage_blocked damage_taken healing_done expected_deaths tankiness
0 Elsa tank Chengdu Hunters 3498.163487 15.436671 6.003150 9.262003 6.003150 13518.055480 6113.562986 12326.822911 10115.036455 0.0 23.800086 3.964600
5 ameng tank Chengdu Hunters 3498.163487 12.520856 1.372149 10.977188 8.232891 11551.170264 4740.750125 13979.642293 10826.026007 0.0 25.473002 3.094053
8 HOTBA tank Guangzhou Charge 8551.738904 20.416900 6.524989 13.821750 4.700798 18664.522404 10178.403621 15039.548751 8212.293321 0.0 19.323043 4.110588
9 Rio tank Guangzhou Charge 8551.738904 15.996747 3.016930 12.979816 5.823377 13930.162221 4611.205186 22859.774330 8461.234009 0.0 19.908786 3.418770
14 Poko tank Philadelphia Fusion 6457.880113 18.117400 6.132043 11.985357 4.273848 17116.883495 7250.029507 18319.923811 7227.170814 0.0 17.005108 3.978875

One final metric tank players should look at is how well they balance blocking damage for their team with dealing damage of their own. Let’s plot All Damage Done versus Damage Blocked to see where players land. In this graph, being near the bottom left is bad:

In [20]:
# Graph each players total damage to their damage blocked in a scatter plot
sns.lmplot(x="all_damage_done", y="damage_blocked", data=tank_df, fit_reg=False, legend=False, hue='player', palette=new_palette, size=6, aspect=1.25, scatter_kws={"s": 75})
plt.legend(loc=9, bbox_to_anchor=(0.5, -0.2), ncol=5)

#Use meaningful titles
plt.title('All Damage Done vs. Damage Blocked for Tank Players')
plt.xlabel('all_damage_done / 10 mins')
plt.ylabel('damage_blocked / 10 mins')
Out[20]:
Text(5.831250000000004, 0.5, 'damage_blocked / 10 mins')

Although we are still plotting individuals in the scatter plot, an interesting pattern appears. There seems to be a diagonal boundary running from Marve1 to Choihyobin that encloses the data points. This suggests a playstyle trade-off, where some players focus on blocking damage while others focus more on damaging the opponents. There is no clear way to say which is better, so the most informative part of the graph is the lower-left region, where we again see ameng, along with Elsa and Fury.

Taking all of these observations into consideration, let's begin building our tank Player Impact Rating. First, we need to normalize our data across all columns. Normalization scales each statistic into the range 0 to 1 (Read More on Normalization), which lets us compare statistics with large values against ones with small values. We can do this with the min-max formula below:

x_norm = (x - min(x)) / (max(x) - min(x))

In [21]:
# Get all values we want to normalize
columns = ['eliminations', 'final_blows', 'assists', 'deaths', 'all_damage_done', 'hero_damage_done', 'damage_blocked', 'damage_taken', 'tankiness']

for c in columns:
    
    # For each row, find the range of values to calculate each stat as a percentage of the total
    def norm_data (row):
        all_values = tank_df[c]
        range_values = all_values.max() - all_values.min()
    
        norm_values = (row[c] - all_values.min()) / range_values
    
        return norm_values

    # Change existing rows to instead contain normalized values of all column specified data
    tank_df[c] = tank_df.apply(lambda row: norm_data(row), axis=1)
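For reference, the same min-max normalization can be applied to all of the chosen columns at once. A vectorized sketch equivalent to the loop above (again, run it instead of the loop, not after it):

In [ ]:
# Vectorized min-max normalization of the selected columns: (x - min) / (max - min)
norm_cols = ['eliminations', 'final_blows', 'assists', 'deaths', 'all_damage_done',
             'hero_damage_done', 'damage_blocked', 'damage_taken', 'tankiness']
col_min = tank_df[norm_cols].min()
col_max = tank_df[norm_cols].max()
tank_df[norm_cols] = (tank_df[norm_cols] - col_min) / (col_max - col_min)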
In [22]:
tank_df.head()
Out[22]:
player role team time_played eliminations final_blows assists deaths all_damage_done hero_damage_done damage_blocked damage_taken healing_done expected_deaths tankiness
0 Elsa tank Chengdu Hunters 3498.163487 0.279040 0.898728 0.000000 0.436798 0.262611 0.261740 0.005367 0.802440 0.0 23.800086 0.698142
5 ameng tank Chengdu Hunters 3498.163487 0.000000 0.000000 0.207243 1.000000 0.035688 0.022569 0.148063 1.000000 0.0 25.473002 0.069934
8 HOTBA tank Guangzhou Charge 8551.738904 0.755641 1.000000 0.550946 0.107842 0.856368 0.969915 0.239570 0.273732 0.0 19.323043 0.803491
9 Rio tank Guangzhou Charge 8551.738904 0.332638 0.319199 0.449217 0.391390 0.310157 0.000000 0.914731 0.342904 0.0 19.908786 0.304258
14 Poko tank Philadelphia Fusion 6457.880113 0.535582 0.923742 0.329058 0.000000 0.677814 0.459735 0.522782 0.000000 0.0 17.005108 0.708444

Once we have our new normalized values, we can select which ones to use in our tank PIR. As we saw above, two of our ‘tank specific’ values are damage blocked and tankiness, which we include because we know how important they are to the role. Since all damage done looked more like a playstyle metric than a role-specific one, we include it alongside the general stats of deaths and eliminations. We then combine these values (adding everything except deaths, which we subtract since dying less is better) to calculate our tank PIR and store it in a new column named ‘PIR’.

In [23]:
# For each player, returns a PIR rating from formula 
def tank_pir (row):
    
    rating = (row['eliminations']) - row['deaths'] + row['all_damage_done'] + row['damage_blocked'] + row['tankiness']
    
    return rating

#Creates new row for each player that contains their PIR score with .apply
tank_df['PIR'] = tank_df.apply(lambda row: tank_pir(row), axis=1)

Now that we have our ratings, let's take a look at where each tank player lies. Using Pandas sort_values feature, we can organize the data in increasing order and graph it with seaborn’s barplot.

In [24]:
# Convert PIR to a float so it can be sorted, then store the sorted values in a new list
tank_df.PIR = tank_df.PIR.astype(float)
tank_ranks = tank_df.sort_values('PIR')
In [25]:
# Graph rankings of tank players based on PIR
sns.set(rc={'figure.figsize':(22,8.27)})
sns.barplot(data=tank_ranks, x="player", y="PIR")
Out[25]:
<AxesSubplot:xlabel='player', ylabel='PIR'>

Looking at these rankings, there is a set of players with very similar PIR; for example, Gator, Rio, TiZi, Pokpo, and SADO all sit at a rating of around 1.75. This occurs in other areas of the graph as well and suggests that while those players may have a similar impact on the game, the way they accomplish it varies. Another interesting thing to note is who sits at the top and bottom of the rankings: we mentioned ameng and Choihyobin before and now see them again at the bottom and top of the list. The range of this data is around 4 points, which suggests a large gap between the weakest and strongest tank PIRs.
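If you prefer exact numbers to reading them off the bar chart, the sorted dataframe can also be inspected directly (an optional quick look using columns we already have):

In [ ]:
# Lowest- and highest-rated tanks by PIR (tank_ranks is sorted in ascending order)
print(tank_ranks[['player', 'team', 'PIR']].head())
print(tank_ranks[['player', 'team', 'PIR']].tail())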

Damage¶

Moving onto damage, we can take a similar starting point by graphing the eliminations to deaths of each damage player using Seaborn’s lmplot again.

In [26]:
# Graph each damage player's eliminations and deaths in a scatter plot

sns.lmplot(x="eliminations", y="deaths", data=damage_df, fit_reg=False, legend=False, hue='player', palette=new_palette, size=6, aspect=2.5, scatter_kws={"s": 75})
plt.legend(loc=9, bbox_to_anchor=(0.5, -0.2), ncol=5)

#Use meaningful titles
plt.title('Eliminations vs. Deaths for Damage Players')
plt.xlabel('Eliminations / 10 mins')
plt.ylabel('Deaths / 10 mins')
Out[26]:
Text(25.960000000000008, 0.5, 'Deaths / 10 mins')

Looking at the players on the ends of the spectrum, we see SeoMinSoo, STRIKER, and GodsB near the higher end and diem, YangXiaoLong, and Guard near the lower end. Compared to the tank eliminations-vs-deaths graph, there appears to be a stronger relationship between lower deaths and higher eliminations.

But as we mentioned before, eliminations in Overwatch 1 are counted in an unusual way: a player is credited with an elimination for both final blows and assists. For this reason, an actual final blow could be weighted more heavily than an assist, since final blows also include solo kills. Let’s look at the breakdown of each player's final blows versus assists using Seaborn. Seaborn offers a function called PairGrid which lets you plot several variables side by side, each in its own panel. For this graph, we plot total eliminations, final blows, and assists. (These values lie in columns 4, 5, and 6 of the dataframe.)

In [27]:
# Make the PairGrid
g = sns.PairGrid(damage_df.sort_values("eliminations", ascending=False),x_vars=damage_df.columns[4:7], y_vars=["player"],height=10, aspect=.55)

# Draw a dot plot using the stripplot function
g.map(sns.stripplot, size=10, orient="h", jitter=False, palette=new_palette, linewidth=1, edgecolor="w")

# Use the same x axis limits on all columns and add better labels
g.set(xlim=(0, 27), xlabel="per 10 mins", ylabel="")

# Use meaningful titles for the columns
titles = ["Eliminations", "Final Blows", "Assists"]

for ax, title in zip(g.axes.flat, titles):

    # Set a different title for each axes
    ax.set(title=title)

    # Make the grid horizontal instead of vertical
    ax.xaxis.grid(False)
    ax.yaxis.grid(True)

sns.despine(left=True, bottom=True)

Players that stand out as having a larger share of final blows relative to assists include Eileen, JinMu, and Fits. On the other end of the spectrum, players like Rascal, nero, and Fl0w3R have more assists than final blows. As we can see, most players tend to have more assists than final blows. We can also see that sorting by final blows would shuffle the rankings far more than sorting by assists, since final blows track total eliminations much less consistently.

But just as we did with tanks, we should ask which metric is best for rating damage players specifically. As the name suggests, dealing damage and getting eliminations is the core of the role. But damage that does not convert into kills is of limited value, so let’s create a stat that measures a damage player’s efficiency. We have access to each player's hero damage done as well as the average health of an enemy hero. If we take the hero damage dealt per 10 minutes and calculate how many eliminations it should have produced, we get an expected-eliminations figure. To do this, we create a new column in our damage_df equal to each player’s hero damage done divided by the average hero health (for these playoffs, roughly 291 HP, based on hero pick rates in the 2019 post-season, found here).

In [28]:
# Create new column in damage_df where its value is hero damage over average hero health
damage_df['expected_elims'] = damage_df.apply(lambda row: (row['hero_damage_done'] / (291)), axis=1)
damage_df.head()
Out[28]:
player role team time_played eliminations final_blows assists deaths all_damage_done hero_damage_done damage_blocked damage_taken healing_done expected_elims
1 JinMu damage Chengdu Hunters 3498.163487 16.294264 10.291114 5.831631 8.575929 15346.232430 7521.057901 0.000000 5205.593526 0.0 25.845560
3 YangXiaoLong damage Chengdu Hunters 3498.163487 14.064523 4.116446 9.948077 8.575929 13450.636678 5632.534883 1546.223231 4742.221269 0.0 19.355790
7 Eileen damage Guangzhou Charge 8551.738904 19.364483 10.524175 8.699985 7.787890 11614.226976 7326.085807 0.000000 6526.211764 0.0 25.175553
10 nero damage Guangzhou Charge 5982.105991 20.561321 9.428118 10.932605 5.616751 15419.611553 8710.263406 0.000000 5008.032877 0.0 29.932177
12 Happy damage Guangzhou Charge 2569.632913 20.314186 8.172374 12.141812 5.370417 15518.655194 6757.202065 0.000000 5602.140228 0.0 23.220626

We can then calculate the damage efficiency by taking the ratio of expected eliminations to actual eliminations and placing the values into a new column in our damage_df.

In [29]:
# Create new column in damage_df where its value is the ratio of expected elims:actual elims
damage_df['damage_eff'] = damage_df.apply(lambda row: (row['expected_elims'] / row['eliminations']), axis=1)
damage_df.head()
Out[29]:
player role team time_played eliminations final_blows assists deaths all_damage_done hero_damage_done damage_blocked damage_taken healing_done expected_elims damage_eff
1 JinMu damage Chengdu Hunters 3498.163487 16.294264 10.291114 5.831631 8.575929 15346.232430 7521.057901 0.000000 5205.593526 0.0 25.845560 1.586175
3 YangXiaoLong damage Chengdu Hunters 3498.163487 14.064523 4.116446 9.948077 8.575929 13450.636678 5632.534883 1546.223231 4742.221269 0.0 19.355790 1.376214
7 Eileen damage Guangzhou Charge 8551.738904 19.364483 10.524175 8.699985 7.787890 11614.226976 7326.085807 0.000000 6526.211764 0.0 25.175553 1.300089
10 nero damage Guangzhou Charge 5982.105991 20.561321 9.428118 10.932605 5.616751 15419.611553 8710.263406 0.000000 5008.032877 0.0 29.932177 1.455752
12 Happy damage Guangzhou Charge 2569.632913 20.314186 8.172374 12.141812 5.370417 15518.655194 6757.202065 0.000000 5602.140228 0.0 23.220626 1.143074

From here, we can use a similar technique as with tanks and use Seaborn’s lmplot to graph the actual eliminations against the expected eliminations. Keep in mind that for this graph a ratio close to 1 is ideal: it means you are getting about as many eliminations as your damage should produce.

In [30]:
#Graph each damage players elims to expected elims in a scatter plot
sns.lmplot(x="eliminations", y="expected_elims", data=damage_df, fit_reg=False, legend=False, hue='player', palette=new_palette, size=8, aspect=1, scatter_kws={"s": 75})
plt.legend(loc=9, bbox_to_anchor=(0.5, -0.2), ncol=5)

#Use meaningful titles
plt.title('Actual Eliminations vs. Expected Eliminations for Damage Players')
plt.xlabel('actual eliminations / 10 mins')
plt.ylabel('expected elims / 10 mins')
Out[30]:
Text(29.334999999999994, 0.5, 'expected elims / 10 mins')

Some players that stand out as having a ratio of close to 1 are eqo and carpe. Players that seem to have a low damage efficiency include Guard and diem, who deal a lot of damage, but contribute to very few eliminations.

Now that we have looked at our damage data, let’s begin creating our damage PIR. We will use the same normalization method as before, except this time we will normalize ‘damage_eff’ as well.

In [31]:
# Get each column we want to normalize
columns = ['eliminations', 'final_blows', 'assists', 'deaths', 'all_damage_done', 'hero_damage_done', 'damage_blocked', 'damage_taken', 'damage_eff']

for c in columns:
    
    # For each row, returns normalized value
    def norm_data (row):
        all_values = damage_df[c]
        range_values = all_values.max() - all_values.min()
    
        norm_values = (row[c] - all_values.min()) / range_values
    
        return norm_values

    # Change existing row to new normalized values
    damage_df[c] = damage_df.apply(lambda row: norm_data(row), axis=1)
In [32]:
damage_df.head()
Out[32]:
player role team time_played eliminations final_blows assists deaths all_damage_done hero_damage_done damage_blocked damage_taken healing_done expected_elims damage_eff
1 JinMu damage Chengdu Hunters 3498.163487 0.298727 0.771239 0.007644 1.000000 0.235032 0.479698 0.000000 0.109243 0.0 25.845560 0.679184
3 YangXiaoLong damage Chengdu Hunters 3498.163487 0.128688 0.000000 0.427866 1.000000 0.152147 0.000000 0.256597 0.004824 0.0 19.355790 0.419691
7 Eileen damage Guangzhou Charge 8551.738904 0.532861 0.800350 0.300456 0.799013 0.071850 0.430174 0.000000 0.406840 0.0 25.175553 0.325607
10 nero damage Guangzhou Charge 5982.105991 0.624131 0.663448 0.528370 0.245271 0.238240 0.781765 0.000000 0.064723 0.0 29.932177 0.517992
12 Happy damage Guangzhou Charge 2569.632913 0.605285 0.506601 0.651811 0.182444 0.242571 0.285673 0.000000 0.198603 0.0 23.220626 0.131551

Using the same method as for the tanks, we can create a formula for our damage PIR and store it in a new column of damage_df. For our damage PIR, eliminations, low deaths, and assists all matter, but higher final blows and better damage efficiency mean your damage is actually being converted into kills; since a lower normalized damage_eff corresponds to more eliminations per point of damage dealt, the formula adds (1 - damage_eff).

In [33]:
# Returns damage PIR using formula provided
def damage_pir (row):
    
    rating = row['eliminations'] - row['deaths'] + (1 - row['damage_eff']) + row['assists'] + row['final_blows']
    
    return rating

# Create new row for PIR for each player
damage_df['PIR'] = damage_df.apply(lambda row: damage_pir(row), axis=1)

Again, we can use Pandas to sort the data and graph the rankings. This time however, since there are 31 players, we will split the graph into two sections so it is easier to view long names like SeoMinSoo or SAEBYEOLBE.

In [34]:
# Convert to float to make it easier to sort values. Store sorted values in new list.
damage_df.PIR = damage_df.PIR.astype(float)
damage_ranks = damage_df.sort_values('PIR')

#Graph first 16 players since sample size is large
sns.set(rc={'figure.figsize':(22,8.27)})
sns.barplot(data=damage_ranks.iloc[:16], x="player", y="PIR")
Out[34]:
<AxesSubplot:xlabel='player', ylabel='PIR'>
In [35]:
# Graph last 15 players, starting at the player who ranked first in graph above.
sns.set(rc={'figure.figsize':(22,8.27)})
sns.barplot(data=damage_ranks.iloc[15:], x="player", y="PIR")
Out[35]:
<AxesSubplot:xlabel='player', ylabel='PIR'>

This graph shows a much more consistent increase across players. While the max / min PIR for tanks was roughly 3.0 / -0.7, the range for damage is a bit larger, with SeoMinSoo at nearly 3.5 PIR and diem at -0.4. We also see a large jump in PIR between the bottom 4 players and the rest; the jump from JinMu to Birdring, at around 0.5 points, is the largest seen yet!

Support¶

Finally, we can take a look at supports. Starting as we normally do, we can graph eliminations to deaths of all support players.

In [36]:
# Graph eliminations vs deaths for each support player

sns.lmplot(x="eliminations", y="deaths", data=support_df, fit_reg=False, legend=False, hue='player', palette=new_palette, size=6, aspect=2.5, scatter_kws={"s": 100})
plt.legend(loc=9, bbox_to_anchor=(0.5, -0.2), ncol=5)

# Use relevant titles
plt.title('Eliminations vs. Deaths for Support Players')
plt.xlabel('Eliminations / 10 mins')
plt.ylabel('Deaths / 10 mins')
Out[36]:
Text(25.960000000000008, 0.5, 'Deaths / 10 mins')

Players that stand out include Viol2t and Twilight, with extremely high eliminations and relatively low deaths. On the other end of the spectrum we see CoMa, with relatively low deaths and eliminations. There also does not appear to be any clear relationship between lower deaths and higher eliminations here.

Since we are looking for support specific stats, unlike tank and damage, we have a fairly obvious metric to use, healing done. For support, healing your team as much as possible has historically been important. Let’s use Seaborn’s barplot feature to see the general rankings on support healing.

In [37]:
f, ax = plt.subplots(figsize=(6, 15))

# Plot the total healing
sns.set_color_codes("pastel")
support_healing = support_df.sort_values("healing_done", ascending=False)
sns.barplot(x="healing_done", y="player", data=support_healing, palette=new_palette, label="healing_done", color="g")
Out[37]:
<AxesSubplot:xlabel='healing_done', ylabel='player'>

From this ranking, we can see the enormous range of healing_done across the board: players like Shaz heal nearly 10,000 more health per 10 minutes than players like neptuNo. We also see a small plateau in the data between moth and Masaa, where healing is very similar across all of the players in between.

Creating our support PIR is a bit more straightforward than the tank and damage versions. Healing done is the obvious role-specific statistic, and eliminations, deaths, and final blows are generally good stats to have. The trouble is choosing the final stat. As mentioned earlier in the Marblr video, assists are earned in a strange way in Overwatch 1, and support players can earn them at a much higher rate than other roles thanks to abilities like damage boost. That makes assists a reasonable final statistic, since supports who contribute more to the game will accumulate them faster.

As we have done twice before, we will normalize the specific rows we need, and calculate the support PIR. Then we again use Seaborn to graph the rankings.

In [38]:
# Get each column we want to normalize data on
columns = ['eliminations', 'final_blows', 'assists', 'deaths', 'all_damage_done', 'hero_damage_done', 'damage_blocked', 'damage_taken', 'healing_done']

for c in columns:
    
    #Returns normalized values for each row provided
    def norm_data (row):
        all_values = support_df[c]
        range_values = all_values.max() - all_values.min()
    
        norm_values = (row[c] - all_values.min()) / range_values
    
        return norm_values
    
    #Change existing rows to instead include normalized values
    support_df[c] = support_df.apply(lambda row: norm_data(row), axis=1)
In [39]:
support_df.head()
Out[39]:
player role team time_played eliminations final_blows assists deaths all_damage_done hero_damage_done damage_blocked damage_taken healing_done
2 Kyo support Chengdu Hunters 3498.163487 0.614356 0.956099 0.535122 0.546948 0.540506 0.539765 0.0 0.794325 0.535692
4 Yveltal support Chengdu Hunters 3498.163487 0.161790 0.403061 0.106970 0.843313 0.123519 0.110728 0.0 0.508308 0.308725
6 Chara support Guangzhou Charge 8551.738904 0.282342 0.170508 0.282457 0.492887 0.494997 0.236940 0.0 0.531907 0.193884
11 shu support Guangzhou Charge 8551.738904 0.644049 1.000000 0.561383 0.280733 0.635123 0.588588 0.0 0.434874 0.569629
13 Boombox support Philadelphia Fusion 6457.880113 0.742907 0.748747 0.717184 0.296975 0.693041 0.660875 0.0 0.438454 0.570349
In [40]:
# Returns support PIR based on formula provided
def support_pir (row):
    
    rating = row['eliminations'] - row['deaths'] + row['healing_done'] + row['assists'] + row['final_blows']
    
    return rating

#Create new row in support_df that contains PIR for each player
support_df['PIR'] = support_df.apply(lambda row: support_pir(row), axis=1)
In [41]:
# Graph sorted support PIR
support_df.PIR = support_df.PIR.astype(float)
support_ranks = support_df.sort_values('PIR')
sns.set(rc={'figure.figsize':(25,8.27)})
sns.barplot(data=support_ranks, x="player", y="PIR")
Out[41]:
<AxesSubplot:xlabel='player', ylabel='PIR'>

Looking at standout players, we see Viol2t skyrocket to the top with a PIR of nearly 4, the highest of any role! Near the lower end we see players like CoMa and Yveltal with ratings just under 0.5. The range of this data is similar to that of the tank PIR; however, unlike the tank and damage rankings, no player falls below 0. The largest jump between two data points is actually at the top, with nearly a 0.5 PIR difference between BEBE and Viol2t.

Hypothesis Testing¶

In our hypothesis testing phase, we will compare each of our PIR sets to see which model provides the most accurate representation of the team standings. To do this, we can use the Residual Sum of Squares (RSS) and the Residual Standard Error (RSE). These methods measure the variance and error in the residuals of a regression model; the closer the RSS/RSE is to 0, the more accurate the model.

Before we begin anything though, we need to organize our data one more time. First, we will use Pandas .groupby() function to group each dataframe by team and take the average PIR across each role. It is important we take the mean of the PIR since some teams may have multiple players subbing in and out.

We can then convert those groups into new dataframes which contain a team name and the team’s PIR for that role. We will also include a dataframe that contains all of the team’s PIR regardless of role. Finally, taking advantage of Pandas sort_values function again, we can rank the teams by PIR to see what their predictions would be.

In [42]:
# Average each teams PIR and store it into a new list
tank_pir_group = tank_df.groupby('team')['PIR'].mean()
damage_pir_group = damage_df.groupby('team')['PIR'].mean()
support_pir_group = support_df.groupby('team')['PIR'].mean()
In [43]:
# Create temp arrays to store info for tank, damage, support, combined
team_list = playoffs.team.unique()
temp_tank = []
temp_damage = []
temp_support = []
temp_all = []

for t in team_list:
    temp_tank.append([t, tank_pir_group[t]])
    temp_damage.append([t, damage_pir_group[t]])
    temp_support.append([t, support_pir_group[t]])
    temp_all.append([t, (tank_pir_group[t] + damage_pir_group[t] + support_pir_group[t]) / 3])
    
#Create four new dataframes with column values Team and Team_PIR
tank_team_ranks = pd.DataFrame(temp_tank, columns = ['team', 'team_PIR'])
damage_team_ranks = pd.DataFrame(temp_damage, columns = ['team', 'team_PIR'])
support_team_ranks = pd.DataFrame(temp_support, columns = ['team', 'team_PIR'])
all_team_ranks = pd.DataFrame(temp_all, columns = ['team', 'team_PIR'])
In [44]:
# Sort values in each dataframe
tank_team_ranks = tank_team_ranks.sort_values('team_PIR', ascending=False)
damage_team_ranks = damage_team_ranks.sort_values('team_PIR', ascending=False)
support_team_ranks = support_team_ranks.sort_values('team_PIR', ascending=False)
all_team_ranks = all_team_ranks.sort_values('team_PIR', ascending=False)

In order to compare these predictions with the actual results, we also need to add in a column to each dataframe containing the actual placement of each of the OWL teams. We can use Pandas .apply() function to go through each dataframe and add in the team’s actual standings.

In [45]:
# Label each team with their actual final standing position in the OWL 2019 playoffs
def label_result (row):
    if row['team'] == 'Chengdu Hunters':
        return 12
    if row['team'] == 'Philadelphia Fusion':
        return 11
    if row['team'] == 'Shanghai Dragons':
        return 10
    if row['team'] == 'Guangzhou Charge':
        return 9
    if row['team'] == 'London Spitfire':
        return 8
    if row['team'] == 'Seoul Dynasty':
        return 7
    if row['team'] == 'Los Angeles Gladiators':
        return 6
    if row['team'] == 'Atlanta Reign':
        return 5
    if row['team'] == 'Hangzhou Spark':
        return 4
    if row['team'] == 'New York Excelsior':
        return 3
    if row['team'] == 'Vancouver Titans':
        return 2
    if row['team'] == 'San Francisco Shock':
        return 1
    return 0

# Create new column to store actual standings of OWL teams
tank_team_ranks['standing'] = tank_team_ranks.apply(lambda row: label_result(row), axis=1)
damage_team_ranks['standing'] = damage_team_ranks.apply(lambda row: label_result(row), axis=1)
support_team_ranks['standing'] = support_team_ranks.apply(lambda row: label_result(row), axis=1)
all_team_ranks['standing'] = all_team_ranks.apply(lambda row: label_result(row), axis=1)
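As an aside, the long chain of if statements in label_result could also be expressed as a dictionary lookup; a more compact sketch (standings_map is a name we introduce here, and the mapping simply restates the standings from the function above):

In [ ]:
# Equivalent alternative: map team names to final standings with a dict
standings_map = {
    'San Francisco Shock': 1, 'Vancouver Titans': 2, 'New York Excelsior': 3,
    'Hangzhou Spark': 4, 'Atlanta Reign': 5, 'Los Angeles Gladiators': 6,
    'Seoul Dynasty': 7, 'London Spitfire': 8, 'Guangzhou Charge': 9,
    'Shanghai Dragons': 10, 'Philadelphia Fusion': 11, 'Chengdu Hunters': 12,
}
# Unknown teams fall back to 0, matching the original function
tank_team_ranks['standing'] = tank_team_ranks['team'].map(standings_map).fillna(0).astype(int)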

Now we can begin our testing. For each role-specific PIR, we will fit a degree-2 polynomial regression of team PIR against final standing: sklearn.preprocessing’s PolynomialFeatures expands the standing into polynomial terms, and sklearn’s LinearRegression fits a linear model over those features. Using the fitted model, we can generate predictions and plot them alongside the actual points to see how accurate the model is. If you want to learn more about the functions used, each can be found here:

  • np.linspace()
  • poly.fit_transform()
  • poly_model.predict()

Finally, we can calculate the RSS for each of the roles by subtracting the actual y values from the predictions and squaring the results. The formula for RSS can be found below:

RSS = Sum((y - pred)^2)

In [46]:
# Provide names to each for data viewing. Go through RSS for each tank, damage, and support PIR predictions. 
tank_team_ranks.name = 'tanks'
damage_team_ranks.name = 'damage'
support_team_ranks.name = 'supports'
all_team_ranks.name = 'all'
RSS = []

# Reshape value to fit Regression model
X = tank_team_ranks[['standing']]
y = tank_team_ranks['team_PIR']

# Create polynomial line
poly = PolynomialFeatures(degree=2)
poly_X = poly.fit_transform(X)

# Fit LinearRegression over poly data
poly_model = LinearRegression()
poly_model.fit(poly_X,y)

# Split values into 12 sets and predict
coefs = poly_model.coef_
standings = np.linspace(1, 12, 12).reshape(-1, 1)
poly_standings = poly.fit_transform(standings)
predictions = poly_model.predict(poly_standings)

# Graph Actual Standing to PIR. Provide relevant titles
plt.plot(standings, predictions)
plt.scatter(y=tank_team_ranks['team_PIR'], x=tank_team_ranks['standing'])
plt.title('Standing vs. PIR for Tank')
plt.xlabel('Standing')
plt.ylabel('PIR')
    
RSS.append([tank_team_ranks.name, ((y - predictions)**2).sum()])
    
print('RSS for', tank_team_ranks.name, ' = ',((y - predictions)**2).sum())
RSS for tanks  =  1.2865755991698622
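Since this fit, plot, and score block is repeated for each role below, it could also be wrapped in a small helper function. The sketch below simply mirrors the cell above (fit_and_score is our own name, not part of the original notebook), returning the RSS computed the same way:

In [ ]:
# Hypothetical helper mirroring the cell above: fit a degree-2 polynomial model of
# PIR against standing, plot it, and return the RSS computed as before.
def fit_and_score(rank_df, title):
    X = rank_df[['standing']]
    y = rank_df['team_PIR']

    poly = PolynomialFeatures(degree=2)
    model = LinearRegression().fit(poly.fit_transform(X), y)

    standings = np.linspace(1, 12, 12).reshape(-1, 1)
    predictions = model.predict(poly.fit_transform(standings))

    plt.plot(standings, predictions)
    plt.scatter(x=rank_df['standing'], y=rank_df['team_PIR'])
    plt.title(f'Standing vs. PIR for {title}')
    plt.xlabel('Standing')
    plt.ylabel('PIR')

    return ((y - predictions) ** 2).sum()

# Example usage: RSS.append(['damage', fit_and_score(damage_team_ranks, 'Damage')])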
In [47]:
# Reshape value to fit Regression model
X = damage_team_ranks[['standing']]
y = damage_team_ranks['team_PIR']

# Create polynomial line
poly = PolynomialFeatures(degree=2)
poly_X = poly.fit_transform(X)

# Fit LinearRegression over poly data
poly_model = LinearRegression()
poly_model.fit(poly_X,y)

# Split values into 12 sets and predict
coefs = poly_model.coef_
standings = np.linspace(1, 12, 12).reshape(-1, 1)
poly_standings = poly.fit_transform(standings)
predictions = poly_model.predict(poly_standings)

# Graph Actual Standing to PIR. Provide relevant titles
plt.plot(standings, predictions)
plt.scatter(y=damage_team_ranks['team_PIR'], x=damage_team_ranks['standing'])
plt.title('Standing vs. PIR for Damage')
plt.xlabel('Standing')
plt.ylabel('PIR')
    
RSS.append([damage_team_ranks.name, ((y - predictions)**2).sum()])
    
print('RSS for', damage_team_ranks.name, ' = ',((y - predictions)**2).sum())
RSS for damage  =  1.6823208231276627
In [48]:
# Reshape value to fit Regression model
X = support_team_ranks[['standing']]
y = support_team_ranks['team_PIR']

# Create polynomial line
poly = PolynomialFeatures(degree=2)
poly_X = poly.fit_transform(X)

# Fit LinearRegression over poly data
poly_model = LinearRegression()
poly_model.fit(poly_X,y)

# Split values into 12 sets and predict
coefs = poly_model.coef_
standings = np.linspace(1, 12, 12).reshape(-1, 1)
poly_standings = poly.fit_transform(standings)
predictions = poly_model.predict(poly_standings)

# Graph Actual Standing to PIR. Provide relevant titles
plt.plot(standings, predictions)
plt.scatter(y=support_team_ranks['team_PIR'], x=support_team_ranks['standing'])
plt.title('Standing vs. PIR for Support')
plt.xlabel('Standing')
plt.ylabel('PIR')
    
RSS.append([support_team_ranks.name, ((y - predictions)**2).sum()])
    
print('RSS for', support_team_ranks.name, ' = ',((y - predictions)**2).sum())
RSS for supports  =  0.977301972003016

Ideally, we would want each of our colored points to lie as close as possible to its respective polynomial curve, which would mean our model predicts the outcome well. However, as we can see from the graphs, this is not the case. To quantify how far off we are for each role, we can take the RSS values calculated above and find the RSE with the formula below (here n = 12 teams, so 1/(n-2) = 1/10):

RSE = sqrt((1 / (n - 2)) * RSS)

In [49]:
import math 
for elem in RSS:
    RSE = math.sqrt((1/10) * elem[1])
    print('RSE for', elem[0], ' = ', RSE)
RSE for tanks  =  0.3586886671153498
RSE for damage  =  0.4101610443627799
RSE for supports  =  0.3126182931312587

Solving for each of the RSE values, we find that the support PIR performs the best of the set. However, because the error is still relatively high, let's try one final test where we average the three roles' PIRs per team and train a model on that.

In [50]:
# Reshape value to fit Regression model
X = all_team_ranks[['standing']]
y = all_team_ranks['team_PIR']

# Create polynomial line
poly = PolynomialFeatures(degree=2)
poly_X = poly.fit_transform(X)

# Fit LinearRegression over poly data
poly_model = LinearRegression()
poly_model.fit(poly_X,y)

# Split values into 12 sets and predict
coefs = poly_model.coef_
standings = np.linspace(1, 12, 12).reshape(-1, 1)
poly_standings = poly.fit_transform(standings)
predictions = poly_model.predict(poly_standings)

# Graph Actual Standing to PIR. Provide relevant titles
plt.plot(standings, predictions)
plt.scatter(y=all_team_ranks['team_PIR'], x=all_team_ranks['standing'])
plt.title('Standing vs. PIR for All Roles')
plt.xlabel('Standing')
plt.ylabel('PIR')

RSS = ((y - predictions)**2).sum()
    
print('RSS for all = ', RSS)
print('RSE for all = ', math.sqrt((1/10) * RSS))
RSS for all =  1.155814060890623
RSE for all =  0.33997265491368905

We see that support is still the best indicator for predicting the rankings, with an RSE of around 0.3126, while combining the roles gives an RSE of about 0.3399. None of these models achieves a great RSE, but they do provide an interesting at-a-glance way of viewing the overall playoff stage.

Communication of Insights¶

Overwatch 1 was an incredibly unique and nuanced game. On top of understanding the game itself, understanding how it records stats and how professional play is organized is another challenge. While this tutorial may have been confusing for readers without a connection to Overwatch, we still covered a lot of the data science pipeline: we read CSV files with Pandas, cleaned up our data, and analyzed it with a variety of graphs. We also learned a little about hypothesis testing and regression models, and saw that our support-based rating had the best RSS and RSE values for predicting the standings.

If you want to continue this experiment on your own, the OWL stats website offers all league data for each individual stage going back to 2018, the league's first year. There were also many things I glossed over regarding the complexity of Overwatch; if you want to extend this project, taking some time to learn about the individual heroes and what they offer would be a good place to start. I hope this tutorial shed some light on the enormous undertaking that statistical analysis can be, while also motivating you to try your own experiments. Good luck!
