CKC Pizza Festival 2024
Background
The History
The first annual Chase-McKeever-McCrystal (CKC) Pizza Festival was held on August 31, 2024, in Brookfield, Connecticut. This new family tradition was established by James McKeever, long-standing rival of Bradford Chase, patriarch of the Chase Family. The earliest recorded mention of the CKC Pizza Festival is a text message from James to select members of the CKC family on the morning of June 25, 2024. James was inspired to host his own event after being deterred by the steep ticket prices of other festivals. An excerpt of the text is provided here for future historical relevance:
...I would like to host the first annual pizza festival…Before I go over the logistics that would be involved i would like you to know how this idea came about...I thought it would be a lot cheaper to take the list and pick 5 or 6 places and order 1 pie each from these places. I'm going to print up the complete list of pizza places participating and then try to map out the locations and delegate people's responsibility...
After more than two months of meticulous planning and coordination, on the morning of Saturday, August 31, 2024, pizza pies from 12 esteemed pizzerias across the New York metropolitan area converged on Brookfield, Connecticut.
The Pizza
Jack McKeever, youngest son of James, and his partner Madeline, brought pies from four pizzerias deep in the heart of Brooklyn. Benjamin Chase, James’ favorite nephew, brought pies from three pizzerias nestled in downtown New Haven. Michael McKeever, eldest son of James, procured pies from two pizzerias on the outskirts of Naugatuck. Erica McCrystal, lone daughter of James, accompanied by her husband Billy and their three kids, chauffeured pizza from three pizzerias all the way from the mystical isles of New Jersey. By 3:00PM on August 31st, a total of 12 pizzerias were represented in James’ kitchen, pizza boxes covering every available surface. It was a sight to behold. A formal list of the pizzerias is included below for documentation:
L&B Spumoni Gardens, 2725 86th Street, Brooklyn, NY, 11223
Di Fara Pizza, 1424 Avenue J, Brooklyn, NY, 11230
Luigi’s Pizza, 686 5th Avenue, Brooklyn, NY, 11215
Luigi’s Pizza, 4704 5th Avenue, Brooklyn, NY, 11220
Frank Pepe Pizzeria Napoletana, 157 Wooster Street, New Haven, CT, 06511
Zeneli Pizzeria e Cucina Napoletana, 138 Wooster Street, New Haven, CT, 06511
Est Est Est Pizza & Restaurant, 1176 Chapel Street, New Haven, CT, 06511
Angeloni’s Restaurant and Pizza, 6 Brookside Avenue, Caldwell, NJ, 07006
Calabria Pizzeria & Restaurant, 588 South Livingston Avenue, Livingston, NJ, 07039
Fuoco Apizza, 461 West Main Street, Cheshire, CT, 06410
Tony D’s, 3 Hanford Place, Caldwell, NJ, 07006
Luna Woodfired Pizza, 384 North Main Street, Naugatuck, CT, 06770
The Judges
The 11 judges for the first annual CKC pizza-rating festival are officially introduced into the ledger here:
James McKeever, founder
Kristi McKeever, wife of James
Michael McKeever, son of James
Jack McKeever, son of James
Madeline Droher, partner of Jack
Erica McCrystal, daughter of James
Billy McCrystal, partner of Erica
Benjamin Chase, nephew of James
Kelly, sister of James
Joe, husband of Kelly
Sharon, friend of Kristi
Logistics
With all the pizzas and judges gathered in a small kitchen in Brookfield, it was time for the festival to commence. James was well prepared; he had purchased a portable pizza oven several weeks in advance, a tool that proved invaluable throughout the day. Kristi McKeever, wife of James, spearheaded pizza cutting and preparation, and Erica took an efficient command of the supply chain route between the kitchen and the pizza oven. Michael and Billy served as pizza chefs, ensuring each pizza was reheated to the same standard. With the pizzas warm and battle stations manned, the rest of the festival was in the hands of the judges.
To preserve unbiased judging, Kristi secretly labeled each pie with a number, and the pies were brought out in a random order to the rest of the judges. For example, Tony D’s pizza might have been introduced as pizza #4. None of the other judges knew the true identity of any of the pizzas when they tried them. Each pizza was brought out one at a time, with the slices cut into bite-sized pieces. Kristi ensured each piece had a good amount of cheese, sauce, and crust, to maintain fair judging conditions. This aspect makes the CKC pizza-rating festival unique; a pizza is judged anonymously on its ability to convey flavor and enjoyment in a single bite without the distraction of how the pie looks or how the slices are cut. Each judge tried a piece of pizza, wrote down their ratings, and moved on to the next one. After pizza from all 12 pizzerias were rated, the judges’ duties were complete.
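The blind-labeling step described above can be sketched in a few lines of Python (a hypothetical illustration; Kristi's actual assignment was done by hand, and the pizzeria names here are just a sample from the roster):

```python
import random

# Sample of pizzerias from the festival roster (illustrative subset)
pizzerias = ["Tony D's", "Di Fara", "L&B Spumoni Gardens", "Est Est Est"]

# Shuffle a copy so each pie receives a secret number unrelated to its identity
lineup = pizzerias.copy()
random.shuffle(lineup)

# Map each pizzeria to its anonymous pizza number (1-based serving order)
secret_labels = {name: i + 1 for i, name in enumerate(lineup)}
```

Only the labeler keeps `secret_labels`; the judges see nothing but the numbers.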
The Data
Raw Scores
Not all judges used the same scoring rubric for rating their pizza. Some took a more analytical approach with up to 10 categories, while others used 5 categories. Some judges used decimal places, some did not. Some rated their pizza out of 10, some out of 20, and some out of 100. Some judges might have just gone with their gut and thrown out a number. For the purposes of scoring the pizzas and comparing their performances, each judge provided a final score for each pizzeria, converted to a 4-20 scale. In this festival, 20 was the highest score a pizzeria could receive and 4 was the lowest possible score. At the end of the rating portion of the festival, we are left with 132 scores: each of the 11 judges provided a score for each of the 12 pizzerias. These raw scores are provided below for the historical record:
import pandas as pd
import seaborn as sns
from matplotlib import pyplot as plt
import scipy.stats as stats

# Load the judge roster and the raw ratings, then attach pizzeria names to each score
names = pd.read_csv("CKC_Names.8.31.2024.csv")
scores = pd.read_csv("CKC_Ratings.8.31.2024.csv")
ratings = pd.merge(scores, names, how = "left", left_on = "Pizza ID", right_on = "ID")
ratings.rename(columns = {"Name" : "Pizzeria"}, inplace = True)

# Pivot to a pizzerias-by-judges grid for display
ratings_output = ratings[["Judge", "Score", "Pizzeria"]].copy()
output = ratings_output.pivot(index = "Pizzeria", columns = "Judge", values = "Score")
display(output)
Pizzeria | Ben | Billy | Erica | Jack | Jim | Joe | Kelly | Kristi | Maddie | Mike | Sharon |
---|---|---|---|---|---|---|---|---|---|---|---|
Angeloni's | 14.2 | 11.0 | 12.0 | 13.4 | 13.0 | 8.0 | 7.0 | 11.0 | 9.5 | 15.2 | 9.0 |
Calibria | 18.0 | 11.5 | 14.5 | 16.0 | 17.0 | 16.0 | 13.0 | 6.0 | 14.5 | 12.2 | 20.0 |
Di Fara | 11.4 | 14.5 | 18.0 | 18.6 | 9.0 | 18.0 | 17.0 | 9.0 | 14.5 | 14.4 | 15.0 |
Est Est Est | 18.2 | 16.0 | 17.5 | 16.4 | 18.0 | 16.0 | 19.0 | 11.0 | 15.0 | 14.6 | 18.0 |
Frank Pepe | 13.8 | 14.0 | 10.0 | 17.6 | 17.0 | 18.0 | 15.0 | 9.0 | 12.0 | 13.2 | 14.0 |
Fuoco | 13.6 | 17.0 | 9.0 | 17.4 | 18.0 | 13.0 | 4.0 | 11.0 | 13.0 | 16.4 | 4.0 |
L&B | 17.6 | 16.5 | 18.0 | 17.0 | 13.0 | 14.0 | 12.0 | 13.0 | 14.5 | 13.6 | 14.0 |
Luigi's 4704 | 16.2 | 12.5 | 12.5 | 16.8 | 16.0 | 17.0 | 17.0 | 11.0 | 13.5 | 15.6 | 17.0 |
Luigi's 686 | 12.8 | 14.0 | 14.5 | 11.8 | 11.0 | 10.0 | 12.0 | 7.0 | 10.0 | 13.8 | 16.0 |
Luna | 12.8 | 13.5 | 16.0 | 12.6 | 16.0 | 15.0 | 9.0 | 9.0 | 10.0 | 14.8 | 14.0 |
Tony D | 16.4 | 19.0 | 7.0 | 12.2 | 17.0 | 16.0 | 9.0 | 9.0 | 11.0 | 15.8 | 13.0 |
Zeneli | 10.4 | 13.0 | 17.0 | 15.8 | 10.0 | 7.0 | 10.0 | 5.0 | 11.0 | 13.2 | 5.0 |
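The conversion of each judge's personal rubric onto the common 4-20 scale described above is, in effect, a linear rescale. A minimal sketch, assuming a judge's rubric ran over some known range (the judges performed their own conversions, so the exact mapping each one used is not recorded):

```python
def to_festival_scale(score, low, high):
    """Linearly map a score from a judge's own [low, high] rubric onto the 4-20 festival scale."""
    return 4 + 16 * (score - low) / (high - low)

# A 75 on a 0-100 rubric lands at 16.0 on the festival scale
print(to_festival_scale(75, 0, 100))
```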
Normalized Scores
In addition to the raw scores shown above, it will be valuable to analyze the judges' scores relative to their personal scoring distributions. For instance, if one judge only gave scores between 10 and 15 and another judge only gave scores between 16 and 20, it is possible they had significantly different interpretations of the scoring rubrics. In other words, one judge's 15 might be equivalent to another judge's 10. To account for this, we can normalize each judge's list of scores by fixing their lowest score at 0, fixing their highest score at 100, and distributing the rest of their scores linearly between 0 and 100. This transformation will ensure all judges' scores are distributed between 0 and 100 regardless of how widely or narrowly they used the original scale of 4 to 20. This means the normalized scores are a better representation of how each pizzeria scored according to each judge's standards. An analysis of these scores will provide additional insight into the judges' behavior and alternative metrics by which to rank the pizzas.
ratings_norm = pd.DataFrame()
for judge in ratings["Judge"].unique():
    temp = ratings[ratings["Judge"] == judge].copy()
    # Min-max normalize this judge's scores onto a 0-100 scale
    high = temp["Score"].max()
    low = temp["Score"].min()
    temp["Score"] = round(100 / (high - low) * (temp["Score"] - low), 2)
    ratings_norm = pd.concat([ratings_norm, temp])
ratings_output = ratings_norm[["Judge", "Score", "Pizzeria"]].copy()
output = ratings_output.pivot(index = "Pizzeria", columns = "Judge", values = "Score").astype(int)
display(output)
Pizzeria | Ben | Billy | Erica | Jack | Jim | Joe | Kelly | Kristi | Maddie | Mike | Sharon |
---|---|---|---|---|---|---|---|---|---|---|---|
Angeloni's | 48 | 0 | 45 | 23 | 44 | 9 | 20 | 75 | 0 | 71 | 31 |
Calibria | 97 | 6 | 68 | 61 | 88 | 81 | 60 | 12 | 90 | 0 | 100 |
Di Fara | 12 | 43 | 100 | 100 | 0 | 100 | 86 | 50 | 90 | 52 | 68 |
Est Est Est | 100 | 62 | 95 | 67 | 100 | 81 | 100 | 75 | 100 | 57 | 87 |
Frank Pepe | 43 | 37 | 27 | 85 | 88 | 100 | 73 | 50 | 45 | 23 | 62 |
Fuoco | 41 | 75 | 18 | 82 | 100 | 54 | 0 | 75 | 63 | 100 | 0 |
L&B | 92 | 68 | 100 | 76 | 44 | 63 | 53 | 100 | 90 | 33 | 62 |
Luigi's 4704 | 74 | 18 | 50 | 73 | 77 | 90 | 86 | 75 | 72 | 80 | 81 |
Luigi's 686 | 30 | 37 | 68 | 0 | 22 | 27 | 53 | 25 | 9 | 38 | 75 |
Luna | 30 | 31 | 81 | 11 | 77 | 72 | 33 | 50 | 9 | 61 | 62 |
Tony D | 76 | 100 | 0 | 5 | 88 | 81 | 33 | 50 | 27 | 85 | 56 |
Zeneli | 0 | 25 | 90 | 58 | 11 | 0 | 40 | 0 | 27 | 23 | 6 |
Judges' Behavior
Let's start by examining the judges' scoring tendencies:
Total Scores
ax = sns.barplot(ratings.groupby("Judge")["Score"].sum().sort_values(), ec = "black")
ax.bar_label(ax.containers[0])
plt.title("Total Raw Score by Judge")
plt.xticks(fontsize = 9)
display()
The maximum possible points a single judge could award was 240 (20 points across 12 pizzas). We can see Kristi was by far the harshest critic, handing out the fewest points overall at a measly 111, or 46%. There was a tight clustering between Billy, Mike, Jim, and Ben, who all awarded around 175 points, or 73%. The most generous judge was Jack, who handed out a whopping 186 points, or 78%. To put this into perspective, Kristi's average score was less than 10 while Jack's average score was higher than 15. Let's take a look at the normalized score totals to learn more:
ax = sns.barplot(ratings_norm.groupby("Judge")["Score"].sum().astype(int).sort_values(), ec = "black")
ax.bar_label(ax.containers[0])
plt.title("Total Normalized Score by Judge")
plt.xticks(fontsize = 9)
display()
Billy had by far the lowest normalized score total, which indicates he rated most pizzas much lower than his favorite. Few pizzas came close to the 19/20 he gave to Tony D's. On the other end of the spectrum, Joe had the highest normalized score total, which indicates he rated most pizzas close to his favorite. Indeed, we see he gave 6 pizzas a score between 16 and 18, while his lowest came in at a 7. There is a large group with similar score totals, including Maddie, Mike, Kristi, Kelly, Jack, and Ben, indicating these judges had similar gaps between their favorite and least favorite pizzas. Similar to Joe, both Jim and Erica rated many pizzas close to their favorite; Jim gave 7 pizzas a score between 16 and 18, and Erica gave 5 pizzas a score between 16 and 18.
Score Distributions
ax = sns.boxplot(data = ratings.sort_values("Judge"), x = "Judge", y = "Score")
plt.title("Raw Score Distribution by Judge")
plt.xticks(fontsize = 9)
display()
The maximum possible score for a single pizza was 20. Sharon was the only judge to award a pizza a perfect score and one of only two judges (along with Kelly) to award a pizza the lowest possible score of 4. Kristi's lowest score was a 5, adding her to the trio of judges with a strong disdain for a particular pizzeria. Mike's scores were all between 12 and 16, making him far and away the judge with the least sensitive palate. Kelly and Erica also showcased strong opinions, with Kelly giving a low score of 4 and a high score of 19, and Erica giving a low score of 7 and a high score of 18. Kristi's scores were all significantly lower than average, ranging from 5 to 13 with most of her scores between 9 and 11. Ben, Billy, Jack, Jim, and Joe had similar score ranges. Billy and Kelly were the only judges to give a score of 19.
ax = sns.boxplot(data = ratings_norm.sort_values("Judge"), x = "Judge", y = "Score")
plt.title("Normalized Score Distribution by Judge")
plt.xticks(fontsize = 9)
display()
The distributions of normalized scores for all judges are fixed between 0 and 100 by design, but we can still learn more about the judges' behavior from them. Kristi and Sharon gave most pizzas a score around half of their highest score. Kristi's highest score was a 13 and she gave 7 pizzerias a score between 5 and 9. Maddie and Jack had the most diverse sets of scores within their scoring ranges. Sharon's two lowest scores were outliers even within her own distribution; she gave two low scores of 4 and 5 despite giving most pizzerias a score between 13 and 20. Jim and Joe had the highest median scores by far, indicating they rated most pizzerias near their highest score. On the other hand, Ben, Kelly, Kristi, Maddie, and Mike had medians near 50%, which suggests their scores were well distributed. Billy's median score is lower than 40%, reinforcing Tony D's as his runaway favorite.
Evaluating the Winner
Eliminating Bias
The question everyone wants answered is: which pizzeria was the best? This is not an easy question to answer well. There are many different scoring metrics we could use to determine the final rankings of these 12 pizzerias; the average score, the median score, the top five best scores, etc. There is not necessarily one scoring metric that is better than another. To maintain the integrity of this family tradition, we will establish a high standard of rigor from the very first CKC Pizza Festival. To find the best pizzeria, we will calculate a variety of different scoring metrics and aggregate them. For each scoring method, we will calculate the results using both the raw scores and the normalized scores. This will prevent criticisms such as “that pizza only won because you used the average not the median!”, or “that pizza would’ve scored higher if it didn’t have that one bad score!”. We will also conduct statistical analyses to test whether the order of the pizzas impacted the judges’ scores. In summary, we have a 3-pronged system for achieving an indisputable pizza champion:
- Multiple scoring methods to eliminate bias due to the data distribution
- Calculating each scoring method with raw and normalized scores to eliminate bias due to the judges' behavior
- Statistical analyses to test for bias due to the format of the contest.
Let’s begin.
final_results = pd.DataFrame(ratings["Pizzeria"].drop_duplicates())
Scoring Method #1: Average
The first scoring method will be a simple average of all the judges' scores:
Raw Scores
results = ratings.groupby("Pizzeria")["Score"].mean().sort_values(ascending = False).reset_index()
ax = sns.barplot(results, x = "Pizzeria", y = "Score", ec = "black")
ax.bar_label(ax.containers[0], fmt = "%.1f")
plt.title("Average Raw Scores")
plt.xticks(fontsize = 8, rotation = 45)
plt.ylim([0, 20])
display()
text = "Raw Average"
results[text] = results["Score"].rank(ascending = False)
final_results = pd.merge(left = final_results, right = results[["Pizzeria", text]], left_on = "Pizzeria", right_on = "Pizzeria")
Normalized Scores
results = ratings_norm.groupby("Pizzeria")["Score"].mean().sort_values(ascending = False).reset_index()
ax = sns.barplot(results, x = "Pizzeria", y = "Score", ec = "black")
ax.bar_label(ax.containers[0], fmt= "%.1f")
plt.title("Average Normalized Scores")
plt.xticks(fontsize = 8, rotation = 45)
plt.ylim([0, 100])
display()
text = "Norm Average"
results[text] = results["Score"].rank(ascending = False)
final_results = pd.merge(left = final_results, right = results[["Pizzeria", text]], left_on = "Pizzeria", right_on = "Pizzeria")
Scoring Method #2: Median
The second scoring method will be a simple median of all judges' scores:
Raw Scores
results = ratings.groupby("Pizzeria")["Score"].median().sort_values(ascending = False).reset_index()
ax = sns.barplot(results, x = "Pizzeria", y = "Score", ec = "black")
ax.bar_label(ax.containers[0], fmt = "%.1f")
plt.title("Median Raw Scores")
plt.xticks(fontsize = 8, rotation = 45)
plt.ylim([0, 20])
display()
text = "Raw Median"
results[text] = results["Score"].rank(ascending = False)
final_results = pd.merge(left = final_results, right = results[["Pizzeria", text]], left_on = "Pizzeria", right_on = "Pizzeria")
Normalized Scores
results = ratings_norm.groupby("Pizzeria")["Score"].median().sort_values(ascending = False).reset_index()
ax = sns.barplot(results, x = "Pizzeria", y = "Score", ec = "black")
ax.bar_label(ax.containers[0], fmt= "%.1f")
plt.title("Median Normalized Scores")
plt.xticks(fontsize = 8, rotation = 45)
plt.ylim([0, 100])
display()
text = "Norm Median"
results[text] = results["Score"].rank(ascending = False)
final_results = pd.merge(left = final_results, right = results[["Pizzeria", text]], left_on = "Pizzeria", right_on = "Pizzeria")
Scoring Method #3: Average Minus BestWorst
The third scoring method will take the average score without the highest and lowest score(s) for each pizzeria. This will eliminate bias that might have been introduced from overly harsh or kind judges.
Raw Scores
temp = ratings.copy()
g = ratings.groupby(['Pizzeria'])['Score'].transform('max')
temp = temp[~(temp['Score'] == g)]
g = temp.groupby(['Pizzeria'])['Score'].transform('min')
temp = temp[~(temp['Score'] == g)]
results = temp.groupby("Pizzeria")["Score"].mean().sort_values(ascending = False).reset_index()
ax = sns.barplot(results, x = "Pizzeria", y = "Score", ec = "black")
ax.bar_label(ax.containers[0], fmt = "%.1f")
plt.title("Average Raw Scores Minus BestWorst")
plt.xticks(fontsize = 8, rotation = 45)
plt.ylim([0, 20])
display()
text = "Raw Average MBW"
results[text] = results["Score"].rank(ascending = False)
final_results = pd.merge(left = final_results, right = results[["Pizzeria", text]], left_on = "Pizzeria", right_on = "Pizzeria")
Normalized Scores
temp = ratings_norm.copy()
g = temp.groupby(['Pizzeria'])['Score'].transform('max')
temp = temp[~(temp['Score'] == g)]
g = temp.groupby(['Pizzeria'])['Score'].transform('min')
temp = temp[~(temp['Score'] == g)]
results = temp.groupby("Pizzeria")["Score"].mean().sort_values(ascending = False).reset_index()
ax = sns.barplot(results, x = "Pizzeria", y = "Score", ec = "black")
ax.bar_label(ax.containers[0], fmt = "%.1f")
plt.title("Average Normalized Scores Minus BestWorst")
plt.xticks(fontsize = 8, rotation = 45)
plt.ylim([0, 100])
display()
text = "Norm Average MBW"
results[text] = results["Score"].rank(ascending = False)
final_results = pd.merge(left = final_results, right = results[["Pizzeria", text]], left_on = "Pizzeria", right_on = "Pizzeria")
Scoring Method #4: Median Minus BestWorst
The fourth scoring method will take the median score without the highest and lowest score(s) for each pizzeria. This will eliminate bias that might have been introduced from overly harsh or kind judges.
Raw Scores
temp = ratings.copy()
g = ratings.groupby(['Pizzeria'])['Score'].transform('max')
temp = temp[~(temp['Score'] == g)]
g = temp.groupby(['Pizzeria'])['Score'].transform('min')
temp = temp[~(temp['Score'] == g)]
results = temp.groupby("Pizzeria")["Score"].median().sort_values(ascending = False).reset_index()
ax = sns.barplot(results, x = "Pizzeria", y = "Score", ec = "black")
ax.bar_label(ax.containers[0], fmt = "%.1f")
plt.title("Median Raw Scores Minus BestWorst")
plt.xticks(fontsize = 8, rotation = 45)
plt.ylim([0, 20])
display()
text = "Raw Median MBW"
results[text] = results["Score"].rank(ascending = False)
final_results = pd.merge(left = final_results, right = results[["Pizzeria", text]], left_on = "Pizzeria", right_on = "Pizzeria")
Normalized Scores
temp = ratings_norm.copy()
g = temp.groupby(['Pizzeria'])['Score'].transform('max')
temp = temp[~(temp['Score'] == g)]
g = temp.groupby(['Pizzeria'])['Score'].transform('min')
temp = temp[~(temp['Score'] == g)]
results = temp.groupby("Pizzeria")["Score"].median().sort_values(ascending = False).reset_index()
ax = sns.barplot(results, x = "Pizzeria", y = "Score", ec = "black")
ax.bar_label(ax.containers[0], fmt = "%.1f")
plt.title("Median Normalized Scores Minus BestWorst")
plt.xticks(fontsize = 8, rotation = 45)
plt.ylim([0, 100])
display()
text = "Norm Median MBW"
results[text] = results["Score"].rank(ascending = False)
final_results = pd.merge(left = final_results, right = results[["Pizzeria", text]], left_on = "Pizzeria", right_on = "Pizzeria")
Scoring Method #5: Average N Best Judges
The fifth scoring method will take the average score for each pizzeria with different sets of judges. We will calculate the average scores with the 3 best judges for each pizzeria, then the 4 best judges for each pizzeria, etc. This scoring method will provide insight into how the pizzerias performed among the judges that liked them the most and will eliminate any bias from groups of harsh judges. For brevity, the final rankings are shown for each scoring method instead of the full scores.
Raw Scores
aggregate_results = pd.DataFrame()
for i in range(3, 10):
    # Average of each pizzeria's i highest raw scores, then rank pizzerias on that average
    temp = ratings.copy()
    temp = temp.groupby('Pizzeria')['Score'].nlargest(i).reset_index(level = 1, drop = True).reset_index()
    results = temp.groupby("Pizzeria")["Score"].mean().sort_values(ascending = False).reset_index()
    results = results.rename(columns = {"Score" : f'{i} Best Raw'})
    for col in results.columns:
        if col != "Pizzeria":
            results[col] = results[col].rank(method = 'dense', ascending = False).astype(int)
    if aggregate_results.empty:
        aggregate_results = results
    else:
        aggregate_results = pd.merge(left = aggregate_results, right = results, on = "Pizzeria")
display(aggregate_results)
final_results = pd.merge(left = final_results, right = aggregate_results, left_on = "Pizzeria", right_on = "Pizzeria")
 | Pizzeria | 3 Best Raw | 4 Best Raw | 5 Best Raw | 6 Best Raw | 7 Best Raw | 8 Best Raw | 9 Best Raw |
---|---|---|---|---|---|---|---|---|
0 | Est Est Est | 1 | 1 | 1 | 1 | 1 | 1 | 1 |
1 | Calibria | 2 | 3 | 2 | 2 | 2 | 4 | 4 |
2 | Di Fara | 3 | 2 | 3 | 3 | 3 | 2 | 3 |
3 | Frank Pepe | 4 | 8 | 8 | 7 | 5 | 6 | 6 |
4 | L&B | 4 | 4 | 6 | 5 | 4 | 5 | 5 |
5 | Fuoco | 5 | 5 | 7 | 8 | 6 | 8 | 8 |
6 | Tony D | 5 | 6 | 4 | 6 | 5 | 7 | 7 |
7 | Luigi's 4704 | 6 | 7 | 5 | 4 | 3 | 3 | 2 |
8 | Luna | 7 | 9 | 9 | 9 | 7 | 9 | 9 |
9 | Zeneli | 8 | 10 | 11 | 11 | 9 | 11 | 12 |
10 | Luigi's 686 | 9 | 11 | 10 | 10 | 8 | 10 | 10 |
11 | Angeloni's | 10 | 12 | 12 | 12 | 10 | 12 | 11 |
Normalized Scores
aggregate_results = pd.DataFrame()
for i in range(3, 10):
    # Average of each pizzeria's i highest normalized scores, then rank pizzerias on that average
    temp = ratings_norm.copy()
    temp = temp.groupby('Pizzeria')['Score'].nlargest(i).reset_index(level = 1, drop = True).reset_index()
    results = temp.groupby("Pizzeria")["Score"].mean().sort_values(ascending = False).reset_index()
    results = results.rename(columns = {"Score" : f'{i} Best Normalized'})
    for col in results.columns:
        if col != "Pizzeria":
            results[col] = results[col].rank(method = 'dense', ascending = False).astype(int)
    if aggregate_results.empty:
        aggregate_results = results
    else:
        aggregate_results = pd.merge(left = aggregate_results, right = results, on = "Pizzeria")
display(aggregate_results)
final_results = pd.merge(left = final_results, right = aggregate_results, left_on = "Pizzeria", right_on = "Pizzeria")
 | Pizzeria | 3 Best Normalized | 4 Best Normalized | 5 Best Normalized | 6 Best Normalized | 7 Best Normalized | 8 Best Normalized | 9 Best Normalized |
---|---|---|---|---|---|---|---|---|
0 | Di Fara | 1 | 2 | 2 | 2 | 2 | 4 | 4 |
1 | Est Est Est | 1 | 1 | 1 | 1 | 1 | 1 | 1 |
2 | L&B | 2 | 3 | 3 | 3 | 3 | 2 | 3 |
3 | Calibria | 3 | 4 | 4 | 4 | 4 | 3 | 5 |
4 | Fuoco | 4 | 5 | 6 | 5 | 6 | 6 | 6 |
5 | Tony D | 5 | 6 | 5 | 7 | 7 | 7 | 7 |
6 | Frank Pepe | 6 | 7 | 8 | 8 | 8 | 8 | 8 |
7 | Luigi's 4704 | 7 | 8 | 7 | 6 | 5 | 5 | 2 |
8 | Luna | 8 | 9 | 9 | 9 | 9 | 9 | 9 |
9 | Luigi's 686 | 9 | 11 | 11 | 11 | 11 | 11 | 10 |
10 | Angeloni's | 10 | 10 | 10 | 10 | 10 | 10 | 11 |
11 | Zeneli | 11 | 12 | 12 | 12 | 12 | 12 | 12 |
Scoring Method #6: Average N Worst Judges
The sixth scoring method, similar to the fifth method, will show how pizzerias performed among the judges that liked them the least. This will eliminate any bias due to groups of overly kind judges.
Raw Scores
aggregate_results = pd.DataFrame()
for i in range(3, 10):
    # Average of each pizzeria's i lowest raw scores, then rank pizzerias on that average
    temp = ratings.copy()
    temp = temp.groupby('Pizzeria')['Score'].nsmallest(i).reset_index(level = 1, drop = True).reset_index()
    results = temp.groupby("Pizzeria")["Score"].mean().sort_values(ascending = False).reset_index()
    results = results.rename(columns = {"Score" : f'{i} Worst Raw'})
    for col in results.columns:
        if col != "Pizzeria":
            results[col] = results[col].rank(method = 'dense', ascending = False).astype(int)
    if aggregate_results.empty:
        aggregate_results = results
    else:
        aggregate_results = pd.merge(left = aggregate_results, right = results, on = "Pizzeria")
display(aggregate_results)
final_results = pd.merge(left = final_results, right = aggregate_results, left_on = "Pizzeria", right_on = "Pizzeria")
 | Pizzeria | 3 Worst Raw | 4 Worst Raw | 5 Worst Raw | 6 Worst Raw | 7 Worst Raw | 8 Worst Raw | 9 Worst Raw |
---|---|---|---|---|---|---|---|---|
0 | Est Est Est | 1 | 1 | 1 | 1 | 1 | 1 | 1 |
1 | L&B | 2 | 2 | 2 | 3 | 3 | 3 | 3 |
2 | Luigi's 4704 | 3 | 3 | 3 | 2 | 2 | 2 | 2 |
3 | Frank Pepe | 4 | 4 | 5 | 5 | 6 | 6 | 6 |
4 | Calibria | 5 | 6 | 6 | 6 | 5 | 5 | 5 |
5 | Di Fara | 6 | 5 | 4 | 4 | 4 | 4 | 4 |
6 | Luna | 7 | 7 | 7 | 7 | 7 | 7 | 7 |
7 | Luigi's 686 | 8 | 8 | 8 | 8 | 9 | 9 | 9 |
8 | Tony D | 9 | 9 | 9 | 9 | 8 | 8 | 8 |
9 | Angeloni's | 10 | 10 | 10 | 10 | 11 | 11 | 11 |
10 | Fuoco | 11 | 11 | 11 | 11 | 10 | 10 | 10 |
11 | Zeneli | 11 | 12 | 12 | 12 | 12 | 12 | 12 |
Normalized Scores
aggregate_results = pd.DataFrame()
for i in range(3, 10):
    # Average of each pizzeria's i lowest normalized scores, then rank pizzerias on that average
    temp = ratings_norm.copy()
    temp = temp.groupby('Pizzeria')['Score'].nsmallest(i).reset_index(level = 1, drop = True).reset_index()
    results = temp.groupby("Pizzeria")["Score"].mean().sort_values(ascending = False).reset_index()
    results = results.rename(columns = {"Score" : f'{i} Worst Normalized'})
    for col in results.columns:
        if col != "Pizzeria":
            results[col] = results[col].rank(method = 'dense', ascending = False).astype(int)
    if aggregate_results.empty:
        aggregate_results = results
    else:
        aggregate_results = pd.merge(left = aggregate_results, right = results, on = "Pizzeria")
display(aggregate_results)
final_results = pd.merge(left = final_results, right = aggregate_results, left_on = "Pizzeria", right_on = "Pizzeria")
 | Pizzeria | 3 Worst Normalized | 4 Worst Normalized | 5 Worst Normalized | 6 Worst Normalized | 7 Worst Normalized | 8 Worst Normalized | 9 Worst Normalized |
---|---|---|---|---|---|---|---|---|
0 | Est Est Est | 1 | 1 | 1 | 1 | 1 | 1 | 1 |
1 | Luigi's 4704 | 2 | 2 | 2 | 2 | 2 | 2 | 2 |
2 | L&B | 3 | 3 | 3 | 3 | 3 | 3 | 3 |
3 | Frank Pepe | 4 | 4 | 4 | 5 | 6 | 6 | 6 |
4 | Di Fara | 5 | 5 | 5 | 4 | 4 | 4 | 4 |
5 | Luna | 6 | 6 | 8 | 9 | 9 | 9 | 9 |
6 | Tony D | 7 | 8 | 7 | 8 | 8 | 7 | 7 |
7 | Luigi's 686 | 8 | 10 | 10 | 10 | 10 | 10 | 10 |
8 | Calibria | 9 | 7 | 6 | 6 | 5 | 5 | 5 |
9 | Fuoco | 10 | 9 | 9 | 7 | 7 | 8 | 8 |
10 | Angeloni's | 11 | 11 | 11 | 11 | 11 | 11 | 11 |
11 | Zeneli | 12 | 12 | 12 | 12 | 12 | 12 | 12 |
Final Results
With all the scoring methods complete, it's time to tabulate the final results.
Standings
It's time to report the final results for the 12 pizzerias of the first annual CKC Pizza Festival. We will calculate the final score for each pizzeria using all 36 scoring methods covered above. Each pizzeria will receive 12 points if they came in first place for a scoring method, 11 points if they came in second, 10 points if they came in third, etc. This means across all 36 scoring methods, the highest possible score for a single pizzeria is 432 points. The final scores will be normalized between 0 and 100 to provide a more relative comparison between the pizzerias.
results = final_results.copy()
results.index = results["Pizzeria"]
results.drop("Pizzeria", axis = 1, inplace = True)
results = len(results.index.unique()) + 1 - results
results["Score"] = results.sum(axis = 1)
results = results[["Score"]].copy()
results['Score'] = ((results['Score'] - results['Score'].min()) / (results['Score'].max() - results['Score'].min())) * 100
ax = sns.barplot(results.sort_values("Score", ascending = False), x = "Pizzeria", y = "Score", ec = "black")
ax.bar_label(ax.containers[0], fmt= "%.1f")
plt.title("Final Scores of the 2024 CKC Pizza Rating Festival")
plt.xticks(fontsize = 8, rotation = 45)
plt.ylim([0, 105])
display()
Testing For Bias
One concern with the format of the first annual CKC pizza-rating festival is that the pizzas were brought out in a specific order. Perhaps the judges were more favorable in the beginning and harsher towards the end. To maintain the integrity of this family tradition, we will conduct rigorous statistical analyses to investigate whether there is any detectable bias related to the order of the pizzas. Let's start with a visual:
pizza_ranks = results["Score"].copy()
# One row per individual rating, keyed by pizzeria, carrying the pizza's lineup position
pizza_orders = ratings.set_index("Pizzeria")["Pizza ID"].copy()
# Attach each pizzeria's final score to every one of its ratings
pizza_data = pd.merge(pizza_orders, pizza_ranks, left_on = "Pizzeria", right_on = "Pizzeria")
sns.scatterplot(data = pizza_data, x = "Pizza ID", y = "Score")
plt.title("Final Scores for Pizzerias by Order in Tasting Lineup")
def label_point(x, y, val, ax):
    # Annotate each point with its pizzeria name, slightly offset from the marker
    a = pd.concat({'x': x, 'y': y, 'val': val}, axis=1)
    for i, point in a.iterrows():
        ax.text(point['x'] + 0.1, point['y'] - 5, str(point['val']), fontsize = 9)
label_point(pizza_data["Pizza ID"], pizza_data["Score"], pizza_data.index.to_series(), plt.gca())
display()
We can see in the graph above that the top 5 pizzerias occupied the 1st, 2nd, 6th, 7th, and 12th positions in the lineup. There does not seem to be a visually obvious correlation between a pizzeria's overall score and its being earlier or later in the lineup. Let's move on to more concrete testing:
Categorical Statistical Tests
We will start by conducting statistical tests to determine if there is a significant difference between the final scores of the pizzerias in the top half of the lineup and the bottom half of the lineup. We will run a variety of tests for completeness.
T-Tests
Final Scores
first_half = pizza_data[pizza_data["Pizza ID"] <= 6]["Score"].copy()
second_half = pizza_data[pizza_data["Pizza ID"] > 6]["Score"].copy()
t_stat, p_value = stats.ttest_ind(first_half, second_half)
print("T-statistic:", t_stat)
print("P-value:", p_value)
T-statistic: 1.5328059077494744 P-value: 0.1277537008396266
Since the p-value is greater than 0.05, there is no evidence of a significant relationship between the position of the pizzeria in the lineup and its scoring.
All Raw Scores
first_half = ratings[ratings["Pizza ID"] <= 6]["Score"].copy()
second_half = ratings[ratings["Pizza ID"] > 6]["Score"].copy()
t_stat, p_value = stats.ttest_ind(first_half, second_half)
print("T-statistic:", t_stat)
print("P-value:", p_value)
T-statistic: 0.39358413005468457 P-value: 0.6945328720113341
Since the p-value is greater than 0.05, there is no evidence of a significant relationship between the position of the pizzeria in the lineup and its scoring.
All Normalized Scores¶
first_half = ratings_norm[ratings_norm["Pizza ID"] <= 6]["Score"].copy()
second_half = ratings_norm[ratings_norm["Pizza ID"] > 6]["Score"].copy()
t_stat, p_value = stats.ttest_ind(first_half, second_half)
print("T-statistic:", t_stat)
print("P-value:", p_value)
T-statistic: 0.7516878960838435
P-value: 0.4535974942323605
Since the p-value is greater than 0.05, there is no evidence of a significant difference in mean normalized scores between the first and second halves of the lineup.
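The t-tests above assume the scores in each half are approximately normally distributed. A Shapiro-Wilk test on each group is one way to check that assumption, and also motivates the nonparametric Mann-Whitney tests that follow. This check was not run in the original notebook, and placeholder scores stand in for the real `ratings` data so the sketch runs on its own.

```python
import numpy as np
from scipy import stats

# Placeholder raw scores: 66 ratings per half (the real data has 132 total)
rng = np.random.default_rng(1)
first_half = rng.normal(14, 3, size=66)
second_half = rng.normal(13, 3, size=66)

# Shapiro-Wilk: a small p-value suggests the sample departs from normality
for name, sample in [("first half", first_half), ("second half", second_half)]:
    w, p = stats.shapiro(sample)
    print(f"{name}: W = {w:.3f}, p = {p:.3f}")
```

If either half clearly fails the normality check, the Mann-Whitney results below are the more trustworthy of the two families of tests.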
Mann-Whitney U Tests¶
Final Scores¶
first_half = pizza_data[pizza_data["Pizza ID"] <= 6]["Score"].copy()
second_half = pizza_data[pizza_data["Pizza ID"] > 6]["Score"].copy()
u_stat, p_value = stats.mannwhitneyu(first_half, second_half, method="exact")
print("U-statistic:", u_stat)
print("P-value:", p_value)
U-statistic: 2541.0
P-value: 0.09909440016666508
Since the p-value is greater than 0.05, there is no evidence of a significant difference in final-score distributions between the first and second halves of the lineup.
All Raw Scores¶
first_half = ratings[ratings["Pizza ID"] <= 6]["Score"].copy()
second_half = ratings[ratings["Pizza ID"] > 6]["Score"].copy()
u_stat, p_value = stats.mannwhitneyu(first_half, second_half, method="exact")
print("U-statistic:", u_stat)
print("P-value:", p_value)
U-statistic: 2292.0
P-value: 0.606593148588398
Since the p-value is greater than 0.05, there is no evidence of a significant difference in raw-score distributions between the first and second halves of the lineup.
All Normalized Scores¶
first_half = ratings_norm[ratings_norm["Pizza ID"] <= 6]["Score"].copy()
second_half = ratings_norm[ratings_norm["Pizza ID"] > 6]["Score"].copy()
u_stat, p_value = stats.mannwhitneyu(first_half, second_half, method="exact")
print("U-statistic:", u_stat)
print("P-value:", p_value)
U-statistic: 2340.0
P-value: 0.46359335005995844
Since the p-value is greater than 0.05, there is no evidence of a significant difference in normalized-score distributions between the first and second halves of the lineup.
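A p-value alone does not convey how large the half-vs-half difference is. The rank-biserial correlation, computed directly from the Mann-Whitney U statistic as r = 1 - 2U/(n₁n₂), gives an effect size on a -1 to 1 scale. This is an addition, not part of the original analysis, and the placeholder scores below stand in for the real data.

```python
import numpy as np
from scipy import stats

# Placeholder scores for the two halves of the lineup (66 ratings each)
rng = np.random.default_rng(2)
first_half = rng.normal(70, 10, size=66)
second_half = rng.normal(65, 10, size=66)

u_stat, p_value = stats.mannwhitneyu(first_half, second_half)
n1, n2 = len(first_half), len(second_half)

# Rank-biserial correlation: 0 means no tendency for either half to outscore
# the other; values near +/-1 mean one half's scores dominate the other's.
r = 1 - 2 * u_stat / (n1 * n2)
print(f"U = {u_stat:.1f}, rank-biserial r = {r:.3f}")
```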
Linear Regression Model¶
Finally, we will conduct a linear regression analysis on the original judges' scores to determine if there is a significant relationship between the pizzeria's order in the lineup and its scores.
Raw Scores¶
ratings = ratings.rename(columns={"Pizza ID": "ID"})
result = sm.ols(formula="Score ~ ID", data=ratings).fit()
print(result.summary())
                            OLS Regression Results
==============================================================================
Dep. Variable:                  Score   R-squared:                       0.006
Model:                            OLS   Adj. R-squared:                 -0.002
Method:                 Least Squares   F-statistic:                    0.7307
Date:                Sun, 24 Nov 2024   Prob (F-statistic):              0.394
Time:                        10:44:27   Log-Likelihood:                -351.14
No. Observations:                 132   AIC:                             706.3
Df Residuals:                     130   BIC:                             712.0
Df Model:                           1
Covariance Type:            nonrobust
==============================================================================
                 coef    std err          t      P>|t|      [0.025      0.975]
------------------------------------------------------------------------------
Intercept     13.9566      0.647     21.573      0.000      12.677      15.237
ID            -0.0751      0.088     -0.855      0.394      -0.249       0.099
==============================================================================
Omnibus:                        7.375   Durbin-Watson:                   1.563
Prob(Omnibus):                  0.025   Jarque-Bera (JB):                7.629
Skew:                          -0.587   Prob(JB):                       0.0221
Kurtosis:                       2.915   Cond. No.                         15.9
==============================================================================

Notes:
[1] Standard Errors assume that the covariance matrix of the errors is correctly specified.
Since the p-value on the coefficient is greater than 0.05, there is no evidence of a significant relationship between the position of the pizzeria in the lineup and its scoring.
Normalized Scores¶
ratings_norm = ratings_norm.rename(columns={"Pizza ID": "ID"})
result = sm.ols(formula="Score ~ ID", data=ratings_norm).fit()
print(result.summary())
                            OLS Regression Results
==============================================================================
Dep. Variable:                  Score   R-squared:                       0.016
Model:                            OLS   Adj. R-squared:                  0.008
Method:                 Least Squares   F-statistic:                     2.120
Date:                Sun, 24 Nov 2024   Prob (F-statistic):              0.148
Time:                        10:44:31   Log-Likelihood:                -642.89
No. Observations:                 132   AIC:                             1290.
Df Residuals:                     130   BIC:                             1296.
Df Model:                           1
Covariance Type:            nonrobust
==============================================================================
                 coef    std err          t      P>|t|      [0.025      0.975]
------------------------------------------------------------------------------
Intercept     62.7568      5.899     10.639      0.000      51.087      74.427
ID            -1.1670      0.801     -1.456      0.148      -2.753       0.419
==============================================================================
Omnibus:                       32.406   Durbin-Watson:                   1.851
Prob(Omnibus):                  0.000   Jarque-Bera (JB):                8.019
Skew:                          -0.253   Prob(JB):                       0.0181
Kurtosis:                       1.904   Cond. No.                         15.9
==============================================================================

Notes:
[1] Standard Errors assume that the covariance matrix of the errors is correctly specified.
Since the p-value on the coefficient is greater than 0.05, there is no evidence of a significant relationship between the position of the pizzeria in the lineup and its scoring.