Last Friday, 20th August 2021, a number of node operators reported unusual occurrences of missed attestations and dropped participation rates on the Beacon Chain.
Upon investigation by various client teams and other stakeholders, the root cause was found to be a slight increase in the number of orphaned blocks, which was traced back to a single Lido node operator. [Note that a single Lido operator controls many validators, not just one or two. Given the amount of ETH staked through Lido, the number of validators controlled by each whitelisted Lido operator is expected to be very high.]
An increase in orphaned blocks means that the attestations they carried must be packed into other blocks, and blocks have a hard limit on the number of aggregates they can accommodate. This led to some attestations being dropped and validators being mildly penalised through no fault of their own.
Ben Edgington described the situation in great detail in his Twitter thread. Here is his description:
I've just been writing up yesterday's little Eth2 beacon chain excitement for next week's What's New in Eth2. I thought I'd give you a quick tweet-thread preview.
To be clear: the beacon chain was absolutely safe, no funds were at risk, no small animals were harmed. It's only noteworthy because, after almost 9 months of near-perfect running, any kind of incident is quite interesting.
On Friday, my own validators missed two attestations. Missed attestations (votes that do not get on chain) happen, but are pretty rare. I noted it, but just assumed my ISP was acting up.
A little later, @Allnodes, a big Teku user, reported to us a significant increase in missed attestations: from the normal zero, to 15 in 12 hours. I checked some Discord forums: a handful of other stakers were reporting similar. It smelt like a network-wide issue.
In addition, network participation (the proportion of total votes getting into blocks) was down by a percent or so. Not a big deal: 98% participation is totally fine, but still a hint that all was not perfect. I pinged the other devs, and the brains got to work.
Nishant spotted that there were also unusual levels of orphaned blocks. These are blocks not included on chain, usually because they are produced too late. Also, the remaining blocks seemed to be unusually full of attestations (at capacity).
The issue is that there is limited space in blocks for attestations. If blocks are orphaned/missing, that increases the number of attestations that must be put in other blocks, and blocks have a hard cap of 128 aggregates. They were overflowing.
The number of orphaned blocks was small, around one in a hundred or so, but the impact was noticeable. The reduced blockspace resulted in attestations being dropped and validators being (mildly) penalised through no fault of their own.
Most of the orphaned blocks were tracked down to a single Lido provider. The Lighthouse team got in touch, they fixed whatever misconfiguration was going on, and everything returned to normal, near-perfect running.
Again, this whole thing is a minor, almost trivial incident, and all is totally fine. However, it concerns me that an issue at an operator running only around 1% of validators had an impact noticeable across the network.
It may be possible to decrease the impact of such outages by increasing the number of aggregate attestations included in blocks. It's currently 128, which is ok to keep the protocol safe, but results in innocent validators being penalised at times like this.
But increasing this would make blocks larger, which is also not desirable. I'm sure we will discuss the trade-offs in due course. It's not a critical issue by any means, but more noticeable as the number of validators increases and blocks get fuller.
The best remedy is not to use large staking pools, people!! The more diverse the network - clients, infrastructure, organisations - the less the impact of any single failure.
It was also pointed out by PoS Ethereum researcher Danny Ryan that another contributing factor could be that Prysm (the most widely used PoS Ethereum client) did not refill its attestation pool when blocks were reorg'd. (The Prysm team was very quick to resolve this.)
What we observed could thus, as Ben pointed out, be because the clients that do refill their attestation pool did not have enough block space to include all the attestations that Prysm was dropping.
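To make the mechanism concrete, here is a purely illustrative sketch of the idea: when blocks are orphaned in a re-org, the aggregates they carried are put back into the client's local attestation pool, and future proposals can only drain 128 of them at a time. This is not Prysm's actual code; the pool structure and names are invented for illustration.
MAX_ATTESTATIONS_PER_BLOCK = 128  # protocol hard cap on aggregates per block

def refill_pool_on_reorg(orphaned_blocks, pool):
    """Put the aggregates carried by orphaned blocks back into the (set-like) pool."""
    for block in orphaned_blocks:
        pool.update(block["attestations"])

def select_for_next_block(pool):
    """Drain up to 128 aggregates for the next proposal; anything left over must wait."""
    selected = list(pool)[:MAX_ATTESTATIONS_PER_BLOCK]
    for agg in selected:
        pool.discard(agg)
    return selected

# Toy usage: two orphaned blocks' worth of aggregates overflow a single proposal
pool = set()
orphaned = [{"attestations": {f"agg_{i}_{j}" for j in range(128)}} for i in range(2)]
refill_pool_on_reorg(orphaned, pool)
print(len(select_for_next_block(pool)), "included,", len(pool), "still waiting")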
In this special edition of the Beacon Digest, we explore the impact of this incident on the Beacon Chain. We do so by analyzing the metrics which we know were directly impacted by the incident: the attestation count, the number of orphaned blocks, and the global participation rate.
In addition, we also look into metrics which may or may not have been indirectly affected by the incident: attester and proposer slashings, and voluntary exits.
These minor incidents are worth dissecting to better understand how the Beacon Chain, a system driven by tens of thousands of stakeholders across the globe, behaves when the actions of a single large entity change. We will also see how quickly the network recovers from these minor hiccups.
We observe these metrics from Epoch 58500 (Aug 18, 2021, 8:00 PM SGT) to Epoch 59560 (Aug 23, 2021, 1:04 PM SGT) to get a sense of how the network changed over time: before, during, and after the incident.
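For reference, epoch numbers can be mapped to wall-clock time from the Beacon Chain genesis; a small helper, assuming the mainnet parameters (genesis timestamp 1606824023, 12-second slots, 32 slots per epoch):
from datetime import datetime, timezone

# Mainnet Beacon Chain parameters (assumed here; adjust for other networks)
GENESIS_TIMESTAMP = 1606824023  # 1 Dec 2020, 12:00:23 UTC
SECONDS_PER_SLOT = 12
SLOTS_PER_EPOCH = 32

def epoch_start_time(epoch: int) -> datetime:
    """Return the UTC wall-clock time at which the given epoch starts."""
    return datetime.fromtimestamp(
        GENESIS_TIMESTAMP + epoch * SLOTS_PER_EPOCH * SECONDS_PER_SLOT,
        tz=timezone.utc,
    )

print(epoch_start_time(58500))  # 2021-08-18 12:00:23+00:00, i.e. 8:00 PM SGT
print(epoch_start_time(59560))  # 2021-08-23 05:04:23+00:00, i.e. 1:04 PM SGT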
Furthermore, we also dive into the attestation efficiency of 590 randomly selected Lido validators before and after the incident, to see how the orphaned blocks affected the performance of individual validators (in contrast to the impact on the overall network that we have been analyzing).
As usual, we begin with collecting all the data we need in order to carry out our analysis!
from web3 import Web3
import json
import requests
import csv
import pandas as pd
import seaborn as sns
import numpy as np
import matplotlib.pyplot as plt
from time import sleep
import plotly.express as px
import plotly.io as pio
pd.options.plotting.backend = "plotly"
pio.renderers.default = "plotly_mimetype+notebook_connected"
import plotly.graph_objects as go
import math
import warnings
attestor_slashing = {}
proposer_slashing = {}
proposed_block_count = {}
global_participation_rate = {}
exit_counts = {}
deposits = {}
attestation_count = {}
orphaned_blocks = {}
with open('api_key.txt', 'r') as api_file:
    api_key = api_file.read().strip()

for epoch in range(58500, 59560):
    x = requests.get('https://beaconcha.in/api/v1/epoch/{}?api_key={}'.format(epoch, api_key))
    # Sleep to stay within the API's call rate limits
    sleep(6)
    data = x.json()['data']
    attestor_slashing[epoch] = data['attesterslashingscount']
    proposer_slashing[epoch] = data['proposerslashingscount']
    proposed_block_count[epoch] = data['proposedblocks']
    global_participation_rate[epoch] = data['globalparticipationrate']
    exit_counts[epoch] = data['voluntaryexitscount']
    deposits[epoch] = data['depositscount']
    attestation_count[epoch] = data['attestationscount']
    orphaned_blocks[epoch] = data['orphanedblocks']
# Writing the dictionaries to csv files, one (epoch, value) pair per row
metrics = {
    'attestor_slashing': attestor_slashing,
    'proposer_slashing': proposer_slashing,
    'proposed_block_count': proposed_block_count,
    'global_participation_rate': global_participation_rate,
    'exit_counts': exit_counts,
    'deposits': deposits,
    'attestation_count': attestation_count,
    'orphaned_blocks': orphaned_blocks,
}
for name, metric in metrics.items():
    with open(f'{name}.csv', 'w') as result_file:
        wr = csv.writer(result_file, dialect='excel')
        for key, value in metric.items():
            wr.writerow([key, value])
files = ["attestor_slashing", "proposer_slashing", "proposed_block_count", "global_participation_rate", "exit_counts", "deposits", "attestation_count", "orphaned_blocks"]
dfs = []
for file in files:
    df = pd.read_csv(f"{file}.csv", header=None, names=["epoch", file])
    df.dropna(subset=["epoch"], inplace=True)
    dfs += [df[[file]]]  # We don't want the epoch column
df = pd.concat([df[["epoch"]]] + dfs, axis=1)  # Concat everything, with the epoch column first
df["global_participation_rate"] *= 100  # Convert to percentages
df = df[df.epoch < max(df["epoch"])]  # Remove the last epoch (queried too soon)
df["epoch"] = df["epoch"].astype(int)
df
|  | epoch | attestor_slashing | proposer_slashing | proposed_block_count | global_participation_rate | exit_counts | deposits | attestation_count | orphaned_blocks |
| --- | --- | --- | --- | --- | --- | --- | --- | --- | --- |
| 0 | 58500 | 0 | 0 | 32 | 97.931033 | 0 | 0 | 3397 | 0 |
| 1 | 58501 | 0 | 0 | 32 | 96.418118 | 0 | 0 | 3272 | 0 |
| 2 | 58502 | 0 | 0 | 31 | 98.627383 | 0 | 0 | 3458 | 0 |
| 3 | 58503 | 0 | 0 | 32 | 99.394751 | 0 | 0 | 2817 | 0 |
| 4 | 58504 | 0 | 0 | 32 | 99.045461 | 0 | 0 | 2870 | 0 |
| ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
| 1054 | 59554 | 0 | 0 | 31 | 98.328453 | 0 | 54 | 3715 | 0 |
| 1055 | 59555 | 0 | 0 | 32 | 97.735530 | 0 | 0 | 3347 | 0 |
| 1056 | 59556 | 0 | 0 | 31 | 97.726738 | 0 | 0 | 3448 | 0 |
| 1057 | 59557 | 0 | 0 | 32 | 99.317855 | 0 | 0 | 2942 | 0 |
| 1058 | 59558 | 0 | 0 | 32 | 97.957760 | 0 | 0 | 3035 | 0 |
1059 rows × 9 columns
The first metric that we analyze is the attestation count. One of the major implications of the increased number of orphaned blocks was that the remaining blocks were overflowing with attestations, so it is interesting to see how the attestation count changed over time.
fig = px.area(df, x="epoch", y="attestation_count", title='Attestation Count', labels = {'epoch': 'Epoch', 'attestation_count': 'Attestation Count'})
fig.show()
We can see from the graph above that there was a sharp increase in the attestation count from around epoch 58840 (Friday, Aug 20, 2021, 8:16 AM SGT), after which it reached its peak value.
At its peak, the attestation count reached values as high as 4095 per epoch. Note that each block carries a maximum of 128 aggregate attestations, and there are at most 32 blocks per epoch, so the maximum number of aggregates that can be published during an epoch is 4096!
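As a quick back-of-the-envelope check on that ceiling, using the two protocol constants mentioned above:
# Back-of-the-envelope check of the per-epoch ceiling on aggregate attestations
MAX_ATTESTATIONS = 128   # aggregates per block (protocol constant)
SLOTS_PER_EPOCH = 32     # blocks per epoch when no slot is missed

max_aggregates_per_epoch = MAX_ATTESTATIONS * SLOTS_PER_EPOCH
print(max_aggregates_per_epoch)         # 4096
print(4095 / max_aggregates_per_epoch)  # the observed peak sits at ~99.98% of capacity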
From about epoch 59110 (Saturday, Aug 21, 2021, 1:04 PM SGT) we see a sharp drop in the attestation count, after which it fluctuates within roughly the same range of values as before the increase.
Given that the root cause of all the strange occurrences was attributed to the increased number of orphaned blocks, this analysis would not be complete without looking at just how many blocks were orphaned.
bucket_size = 200
df["bucket"] = np.floor_divide(df["epoch"], bucket_size)
df["n_bxs"] = 1
df_bucket = df[["bucket", "orphaned_blocks", "n_bxs"]].groupby(["bucket", "orphaned_blocks"]).sum("n_bxs").reset_index()
df_bucket["epoch"] = df_bucket.bucket.apply(
    lambda bucket: f"{max(min(df['epoch']), bucket * bucket_size)}-{min(max(df['epoch']), (bucket + 1) * bucket_size)}"
)
fig = px.scatter(df_bucket, x = 'epoch', y = 'orphaned_blocks', size = 'n_bxs',
                 labels={ "orphaned_blocks": "Number of Orphaned Blocks", "epoch": "Epoch", "n_bxs": "Count" },
                 title = f"Orphaned Blocks count in intervals of {bucket_size} Epochs")
fig
When we plot the orphaned block counts in intervals of 200 epochs, we can clearly see that, out of all the epoch intervals in consideration, the intervals (58800 - 59000) and (59000 - 59200) stand out, containing far more orphaned blocks than any of the other intervals.
We continue our analysis by looking at how the participation rate was affected by this mini incident.
bucket_size = 100
df["bucket"] = np.floor_divide(df["epoch"], bucket_size)
df["n_bxs"] = 1
bins = pd.IntervalIndex.from_tuples([(i, i+1) for i in range(int(min(df["global_participation_rate"])), 100)][::-1])
df["participation_bin"] = pd.cut(df["global_participation_rate"], bins)
df_bucket = df[["bucket", "participation_bin", "n_bxs"]].groupby(["bucket", "participation_bin"]).sum("n_bxs").reset_index()
epoch_names = df_bucket.bucket.apply(
    lambda bucket: f"{max(min(df['epoch']), bucket * bucket_size)}-{min(max(df['epoch']), (bucket + 1) * bucket_size)}"
)
df_bucket["epoch"] = epoch_names
df_bucket = df_bucket[["participation_bin", "n_bxs", "epoch"]].pivot(index="participation_bin", columns=["epoch"])
px.imshow(
    df_bucket.to_numpy(),
    labels=dict(x="Epochs", y="Participation rate", color="Frequency"),
    x = sorted(list(set(epoch_names))),
    y = [str(s) for s in np.flip(np.arange(int(min(df["global_participation_rate"])), 100))],
    color_continuous_scale='blues'
)
We see that the epoch intervals (58800 - 59000) and (59000 - 59200) continue to show anomalous behaviour* when compared to the other intervals: it is in these ranges that the participation rate drops to the lowest values of the whole observation window.
In fact, specifically in the range (58800 - 59000), we see epochs for which the participation rate fell to values as low as 92.2%, which is in general quite rare (see our previous Beacon Digests).
* Anomalous here means that the participation rate is not only lower than in the other epochs in consideration, but also lower than in all other epochs that we have analyzed since the inception of the Beacon Digest.
While there are no direct reports of the following metrics being affected by the overflowing attestations, we thought it would still be interesting to look into them, to show that despite small incidents such as this one, most parts of the complex system that is the Beacon Chain continue to function as usual.
rng = np.random.default_rng(42)
df['temp'] = rng.uniform(0, 10, len(df["epoch"]))  # random y-jitter so that the markers don't overlap
fig = px.scatter(
    df[df.attestor_slashing > 0], x = 'epoch', y = 'temp', size = 'attestor_slashing',
    size_max = 20, labels = {"epoch": "Epoch"},
    title = "Attester slashings"
)
fig.update_xaxes(range=(min(df["epoch"]), max(df["epoch"])))
fig.update_yaxes(visible=False)
fig.show()
fig = px.scatter(
    df[df.proposer_slashing > 0], x = 'epoch', y = 'temp', size = 'proposer_slashing',
    size_max = 20, labels = {"epoch": "Epoch"},
    title = "Proposer slashings"
)
fig.update_xaxes(range=(min(df["epoch"]), max(df["epoch"])))
fig.update_yaxes(visible=False)
fig.show()
We note that there was 1 attester slashing event and 0 proposer slashing events in this range of epochs, neither of which is unusual in any way.
We also thought it would be interesting to see whether any validators tried to initiate a voluntary exit, given that a few validators were, as Ben put it, being (mildly) penalised through no fault of their own.
px.line(x=df['epoch'], y=df['exit_counts'], labels = {"x": "Epoch", "y": "Number of exits"}, title = "Number of voluntary exits")
We observe that there were 0 voluntary exits in this range of epochs.
While our focus so far has mainly been on how this incident impacted the network as a whole, we now switch gears and look at how it affected the long-term performance of 590 randomly selected Lido validators (since the source of the incident was traced to a Lido operator).
The first metric that we look at is attestation effectiveness. While more orphaned blocks do not necessarily mean a decrease in a validator's efficiency, it is still interesting to check whether Lido attestations were also below their usual mark during this period.
As explained in great detail in this blog post by Attestant, this metric gives us an idea of the usefulness of an attestation in terms of both block production and inclusion distance.
The formula to calculate the attestation efficiency of a single attestation is:
$$ \frac{\text{earliest inclusion slot} - \text{attestation slot}}{\text{actual inclusion slot} - \text{attestation slot}} $$

When we average this out over multiple attestations, we get a metric that indicates how "effective" the validator has been in performing its duties.
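As a minimal sketch of the formula above (our own illustration, not Attestant's implementation), the per-attestation value and its average could be computed as follows:
# Minimal illustration of the attestation-efficiency formula above
# (our own sketch, not Attestant's implementation).

def attestation_efficiency(attestation_slot: int,
                           earliest_inclusion_slot: int,
                           actual_inclusion_slot: int) -> float:
    """Efficiency of a single attestation: 1.0 means it was included as early as possible."""
    return (earliest_inclusion_slot - attestation_slot) / (actual_inclusion_slot - attestation_slot)

def average_efficiency(attestations) -> float:
    """Average the per-attestation efficiencies for one validator."""
    values = [attestation_efficiency(*a) for a in attestations]
    return sum(values) / len(values)

# Toy example: one optimally included attestation and one delayed by two extra slots
print(average_efficiency([(100, 101, 101), (200, 201, 203)]))  # (1.0 + 1/3) / 2 ≈ 0.67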
We look at the average attestation efficiency of 590 randomly selected Lido validators:
1) based on the data we scraped on 8th August 2021, and
2) based on the data we scraped today (on 23rd August 2021),
to see how it changed over the course of this incident.
names = ['Validator Index', 'Attestation Efficiency']
df1 = pd.read_csv('lido_effectiveness_0809.csv', header = None, names = names)
df2 = pd.read_csv('lido_effectiveness_0823.csv', header = None, names = names)
# Drop any rows with a missing validator index
nan_value = float("NaN")
df2.replace("", nan_value, inplace=True)
df2.dropna(subset = ["Validator Index"], inplace=True)
df2.reset_index(drop=True, inplace=True)
print("Summary stats of efficiency before the incident")
df1['Attestation Efficiency'].describe()
Summary stats of efficiency before the incident
count    591.000000
mean       0.993807
std        0.013123
min        0.916667
25%        0.990099
50%        1.000000
75%        1.000000
max        1.000000
Name: Attestation Efficiency, dtype: float64
print("Summary stats of efficiency after the incident")
df2['Attestation Efficiency'].describe()
Summary stats of efficiency after the incident
count    591.000000
mean       0.992666
std        0.017333
min        0.847458
25%        1.000000
50%        1.000000
75%        1.000000
max        1.000000
Name: Attestation Efficiency, dtype: float64
from plotly.subplots import make_subplots
fig = make_subplots(rows=2, cols=1)
fig.append_trace(go.Violin(
    name = 'Before',
    x = df1['Attestation Efficiency']
), row=1, col=1)
fig.append_trace(go.Violin(
    name = 'After',
    x = df2['Attestation Efficiency'],
), row=2, col=1)
fig.update_layout(height=600, width=600, title_text="Attestation efficiency of 590 random Lido validators before and after the incident")
fig.update_xaxes(range=[0.84, 1.01])
fig.show()
While the attestation efficiency of most validators continues to lie between 0.95 and 1 even after the incident, for some validators it dropped below 0.9, which was not previously the case.
We also see from the summary statistics that the mean fell from 0.993807 to 0.992666.
Overall, the attestation efficiencies of most validators remain quite high, while those of a few have fallen to relatively lower values.
To conclude our analysis, we look into the day-wise earnings of Lido validator #96325, which on 08/09 had an attestation efficiency of 1 and on 08/23 an attestation efficiency of about 0.87.
We know that validator earnings are directly and negatively impacted by orphaned blocks, but we do not expect a large enough deviation to sound off an "anomaly detector", due to the high variability in rewards given the stochastic nature of block production.
(If a validator happens to be called on to propose a block on a given day, their earnings for that day will be much higher than on days when they are not. Being selected to propose a block is probabilistic in nature.)
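To make this variability concrete, here is a rough sketch of how rarely any single validator expects to propose a block. The active validator count below is an assumed round number for illustration (it was roughly in this range in August 2021), not a measured value.
# Rough illustration of why daily earnings are so variable: block proposals are rare and random
ACTIVE_VALIDATORS = 200_000          # assumed round number, for illustration only
SLOTS_PER_DAY = 24 * 60 * 60 // 12   # 7200 twelve-second slots per day

expected_proposals_per_day = SLOTS_PER_DAY / ACTIVE_VALIDATORS
print(expected_proposals_per_day)      # ~0.036 proposals per validator per day
print(1 / expected_proposals_per_day)  # i.e. roughly one proposal every ~28 days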
x = requests.get('https://beaconcha.in/api/v1/validator/stats/96325?api_key={}'.format(api_key))
data = x.json()['data']
earnings_dict = {}
for i in data:
    # Daily earnings = end-of-day balance minus start-of-day balance (beaconcha.in reports balances in Gwei).
    # Day 261 is used as the reference day, matching the "Days since incident" axis below.
    earnings_dict[i['day'] - 261] = i['end_balance'] - i['start_balance']
df_earnings = pd.DataFrame(list(earnings_dict.items()), columns = ['Days since incident', 'Earnings'])
fig = px.area(df_earnings, x="Days since incident", y="Earnings", title='Earnings of validator #96325')
fig.update_xaxes(range=[-15, 2])
fig.update_yaxes(range=[5000000, 7000000])
fig.show()
If we look at the earnings of the validator over a period of 15 days, we see that while there is a small dip in their earnings 1 day after the incident, as we hypothesised, the dip is not significant enough to sound any alarm that something out of the ordinary has happened.
This means that despite this small incident, people who have staked their ETH using Lido continue to earn rewards.
Here are my closing thoughts before concluding this data analysis:
1) Kudos to the Prysmatic Labs team for their very quick response in coming up with a fix to properly reinsert re-org'ed attestations.
2) As we saw in our analysis, even though metrics such as the participation rate did drop, the fall was only 1-2%, allowing the system to keep functioning in near-optimal conditions. Overall, the network did not take that big of a hit and was up and running the whole time.
3) Most of our notebooks thus far have focused on the extent of decentralization in the PoS Ethereum network, and this incident is a classic demonstration of why it is in fact very important. If the node operator whose blocks were being orphaned had controlled only a small number of validators, the effects would not even have been noticed by others in the network; but since it was one of Lido's operators, and Lido as of today accounts for 10.8% of all ETH staked on the network, the effects of one operator's hiccups were felt by a significant number of validators. Decentralization (which is at the heart of blockchain systems) aims to remove any single points of failure, so compromising on it would essentially mean compromising on arguably one of the most important promises of distributed systems.