In this issue of Beacondigest, in addition to our recurring analysis of network metrics, we also analyze strategic considerations in Proof-of-Stake (PoS) Ethereum staking through the concept of oceanic games. The notion was first put forth by J.W. Milnor and L.S. Shapley in 1978 and has since been used to study decision-making strategies, especially in weighted voting systems. The concept was adapted to blockchain mining by researchers Nikos Leonardos, Stefanos Leonardos and Georgios Piliouras in their paper Oceanic Games: Centralization Risks and Incentives in Blockchain Mining.
In this notebook we extend this analysis to ETH staking to estimate the value per unit resource for major staking "entities".
The outline of this notebook is as follows: we first introduce oceanic games, then apply the model to the current distribution of stake on the Beacon Chain, and finally continue our recurring analysis of network metrics.
The first question we aim to answer is: what are oceanic games? In the context of corporate governance, they are a class of games that involve two types of players:
Atomic players: a small number of major shareholders, each of whom individually controls a significant fraction of the total resources.
Oceanic players: an "ocean" of many small shareholders, each of whom individually controls a negligible fraction of the total resources.
The main focus when analyzing such games is to measure the value of each entity's holdings per unit of resource, given the distribution of resources among shareholders.
As is commonly observed in the scientific literature, the value of a resource depends on more than just the amount in one's possession.
For example, in the context of blockchain mining: consider a party with access to 51% of all mining resources versus one with access to 49%. While the difference is only 2%, the holding in the first case is far more valuable, since that party has complete control over the blockchain. This extends to the case where miners collude with each other: if one miner controls 49% of all mining resources and another 2%, their combined holding is worth more than it would be if the first miner controlled only 47% of the total.
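To make this concrete, here is a minimal sketch (a toy illustration, not taken from the paper) that computes exact Shapley values for a three-player weighted-majority game. With weights of 49%, 2% and 49% and a 51% quota, no single player wins alone and any two players do, so all three are equally powerful despite the very unequal weights; with weights of 51%, 2% and 47%, the first player is a dictator.
from itertools import permutations
from math import factorial

def shapley_values(weights, quota):
    # Exact Shapley values of the weighted-majority game (quota; weights):
    # a player's value is the fraction of orderings in which it is pivotal.
    n = len(weights)
    values = [0.0] * n
    for order in permutations(range(n)):
        running = 0
        for player in order:
            # Pivotal: this player's weight turns the coalition formed so far from losing to winning
            if running < quota <= running + weights[player]:
                values[player] += 1
            running += weights[player]
    return [v / factorial(n) for v in values]

print(shapley_values([49, 2, 49], quota=51))  # all 1/3: any two players form a majority
print(shapley_values([51, 2, 47], quota=51))  # [1.0, 0.0, 0.0]: the first player is a dictator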
The aim of our analysis, then, is to measure the value per unit resource of the ETH staked on the Beacon Chain, for both the major staking entities and the ocean of small validators.
These major staking entities can be thought of as PoS parallels to mining pools under Proof-of-Work (PoW).
Without going too much into the technical details, here is the overview of the Oceanic Games model:
Stakers: They refer to the block proposers and validators that take part in the PoS consensus after making their initial deposit of 32 ETH. Stakers are made up of two important components:
Major stakers: the atomic players, i.e. entities that individually control a significant fraction of all staked ETH.
The ocean: the large number of small stakers, each of whom individually controls a negligible fraction of all staked ETH.
Resources: Refers to the native cryptocurrency (ETH) deposited by stakers to take part in PoS consensus. In our analysis, we measure resources in terms of the fraction of staked ether that an entity controls.
Now for the interesting portion of the notebook: applying the model to Ethereum's PoS consensus! The first step is to identify the stakers, both the major stakers and the ocean, as well as the resources they possess.
But the first stage, as always, is data collection. We collect data on the eth1 deposits made for the first 163400 activated validators using beaconcha.in's API. We then identify which entities control large portions of the total ETH staked on the Beacon Chain.
#Import all the modules
import requests
import json
import csv
import pandas as pd
import seaborn as sns
import numpy as np
import matplotlib.pyplot as plt
from time import sleep  # used below to respect the API rate limits
import plotly.express as px
import plotly.io as pio
pd.options.plotting.backend = "plotly"
pio.renderers.default = "plotly_mimetype+notebook_connected"
import plotly.graph_objects as go
import math
# validator_staking = {}
# with open('api_key.txt', 'r') as api_file:
#     api_key = api_file.read()
# # Query the deposits of validators 0-163399 in batches of 100 indices per request
# for i in range(0, 163399, 100):
#     str1 = ''
#     for j in range(99):
#         str1 = str1 + str(i + j) + ','
#     str1 = str1 + str(i + 99)
#     x = requests.get('https://beaconcha.in/api/v1/validator/{}/deposits?api_key={}'.format(str1, api_key))
#     # Add a sleep to stay within the call rate limits
#     sleep(6)
#     data = x.json()['data']
#     # Aggregate the deposited amounts by the eth1 address that sent the deposit
#     for t in data:
#         if validator_staking.get(t['from_address']) is not None:
#             validator_staking[t['from_address']] += t['amount']
#         else:
#             validator_staking[t['from_address']] = t['amount']
# # Fetch the deposits of the remaining validator separately
# with open('api_key.txt', 'r') as api_file:
#     api_key = api_file.read()
# x = requests.get('https://beaconcha.in/api/v1/validator/{}/deposits?api_key={}'.format(163400, api_key))
# t = x.json()['data']
# # For a single validator the 'data' field may hold a single deposit rather than a list
# deposits = t if isinstance(t, list) else [t]
# for t in deposits:
#     if validator_staking.get(t['from_address']) is not None:
#         validator_staking[t['from_address']] += t['amount']
#     else:
#         validator_staking[t['from_address']] = t['amount']
# # Write the aggregated dictionary to a csv file
# with open('staking_pools.csv', 'w') as result_file:
#     wr = csv.writer(result_file, dialect='excel')
#     for key, value in validator_staking.items():
#         wr.writerow([key, value])
df = pd.read_csv('staking_pools.csv', header= None, names = ["address","stake"])
df['percentage_stake'] = (df['stake']/df['stake'].sum())
print(len(df))
print(len(df)/163400)
28934
0.1770746634026928
At this point, we see a very interesting result! Looking at the wallet addresses that sent the deposits which activated these 163400 validators, we find only 28934 distinct addresses. In other words, the number of unique depositing addresses is only about 17.7% of the number of validators activated.
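As a quick sanity check, we can estimate how many validators the average depositing address funded. This sketch assumes the API reports deposit amounts in Gwei (so 32 ETH per validator corresponds to 32e9 Gwei) and that essentially every validator deposited exactly 32 ETH:
# Approximate number of validators funded per depositing address
validators_per_address = df['stake'] / 32e9
# Roughly 163400 / 28934, i.e. about 5.6 validators per address on average
print(validators_per_address.mean())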
sorted_df = df.sort_values('percentage_stake',ascending=False)
sorted_df.insert(1, 'ID', range(1, 1 + len(df)))
sorted_df = sorted_df[sorted_df.columns[1:4]]
print(sorted_df.head(n=10))
#print(sorted_df.head(n=6))
#print(13.911047+2.176371+1.582760+1.488614+1.223292+1.050894)
          ID            stake  percentage_stake
3345       1  728160000000000          0.139110
5012       2  113920000000000          0.021764
2479       3   82848000000000          0.015828
9722       4   77920000000000          0.014886
1153       5   64032000000000          0.012233
4824       6   55008000000000          0.010509
601        7   48768000000000          0.009317
5870       8   48736000000000          0.009311
4789       9   45120000000000          0.008620
22874     10   44192000000000          0.008443
The above table shows the top 10 wallet addresses, arranged in descending order of the percentage of staked ether they control. [The addresses have not been displayed for the sake of the privacy of these entities.] We consider the first 6 entities to be atomic players, or major stakers, since each controls more than 1% of all the ETH staked. The remaining ones are considered oceanic.
Out of these 6 entities, only 2 have public tags on their wallet address from which we can deduce which institution they represent: the largest, which controls 13.9% of the stake, is the US-based exchange Kraken, and the third largest, which controls about 1.58%, belongs to the financial institution Bitcoin Suisse.
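To make the classification explicit, here is a short sketch (using the 1% threshold mentioned above) that separates the atomic players from the ocean and computes the ocean's aggregate share of the stake; these percentages, together with the ocean share, are the numbers used in the next cell.
# Atomic players: entities controlling more than 1% of all staked ETH
atomic = sorted_df[sorted_df['percentage_stake'] > 0.01]
ocean_share = 1 - atomic['percentage_stake'].sum()
print(atomic[['ID', 'percentage_stake']])
print("Ocean share: {:.4f}".format(ocean_share))  # roughly 0.7857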
Using this initial distribution, we can now estimate the values per unit resource for the 6 major staking entities and the entirety of the ocean. For this, we first use the publicly available ssocean software to compute the ssindices of the atomic players and the ocean, and then divide each index by the fraction of resources that player possesses to obtain its value per unit resource.
ss_index = [0.161317,0.021623,0.015633,0.014690,0.012041,0.010327,0.764370]
resource_percentage = [0.139110,0.021764,0.015828,0.014886,0.012233,0.010509,0.785700]
value_per_unit_resource = []
for i in range(7):
value_per_unit_resource.append(ss_index[i]/resource_percentage[i])
x_axis = [1,2,3,4,5,6,7]
from plotly.subplots import make_subplots
import plotly.graph_objects as go
fig = make_subplots(
rows=1, cols=2,
subplot_titles=["Value per unit resource", "Percentage of resource owned by entities"]
)
fig.add_trace(
go.Scatter(x=x_axis, y=value_per_unit_resource, name="Value per unit resource"),
row=1, col=1
)
fig.add_trace(
go.Scatter(x=x_axis, y=[r * 100 for r in resource_percentage], name="Percentage of resource"),
row=1, col=2
)
fig.update_layout(
height=500,
width=1000,
title_text="Big stakers and the ocean: statistics"
)
fig.update_xaxes(
row=1, col=1,
tickmode="array", tickvals=np.arange(1,8), ticktext=["Largest staker", "2nd largest", "3rd", "4th", "5th", "6th", "Ocean"]
)
fig.update_xaxes(
row=1, col=2,
tickmode="array", tickvals=np.arange(1,8), ticktext=["Largest staker", "2nd largest", "3rd", "4th", "5th", "6th", "Ocean"]
)
fig.show()
Hence, the results clearly show that the larger the share of resources, the higher the value per unit resource, which is consistent with the findings of Leonardos, Leonardos and Piliouras.
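As a rough cross-check of the ssindices used above, here is a minimal Monte Carlo sketch of the limit values of an oceanic majority game in the Milnor-Shapley sense: each atomic player draws a uniform arrival time, the ocean is assumed to arrive uniformly over time, and a player's value is the probability of being pivotal with respect to the 50% quota. This is only an approximation under those assumptions, not the ssocean implementation.
def oceanic_shapley_mc(atomic_weights, quota=0.5, n_samples=100_000, seed=1):
    # Monte Carlo estimate of the limit Shapley values of the atomic players,
    # with the ocean (weight 1 - sum(atomic_weights)) arriving uniformly over time.
    rng = np.random.default_rng(seed)
    w = np.array(atomic_weights)
    ocean = 1.0 - w.sum()
    pivots = np.zeros(len(w))
    for _ in range(n_samples):
        t = rng.uniform(0, 1, len(w))  # arrival times of the atomic players
        for idx in np.argsort(t):
            before = w[t < t[idx]].sum() + ocean * t[idx]
            # Pivotal: this player's weight pushes the coalition past the quota
            if before < quota <= before + w[idx]:
                pivots[idx] += 1
                break
    atomic_values = pivots / n_samples
    return atomic_values, 1.0 - atomic_values.sum()  # the ocean receives the remainder

est_atomic, est_ocean = oceanic_shapley_mc(resource_percentage[:6])
print(est_atomic, est_ocean)  # should land in the same ballpark as ss_index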
Two caveats about this analysis:
1) We assume that, among the first 163400 validators, the number of deactivated validators is negligible. In reality, about 140 validators have successfully exited and another 140 have been slashed, so together they make up close to 0.17% of the validator population we consider.
2) In this notebook, we classify "entities" based on their eth1 address. In reality, however, a single entity can make deposits from more than one eth1 address. The logical next step of this analysis is to identify all the addresses that belong to a single entity and aggregate them (a sketch of what this could look like is given below); we will do so in subsequent notebooks.
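The sketch below illustrates that aggregation; address_to_entity is a hypothetical, deliberately empty mapping used purely for illustration, and building it is the actual work left for a later notebook.
# Hypothetical mapping from eth1 addresses to entity labels, e.g. {'0xabc...': 'Kraken'}.
# It is left empty here; populating it is the subject of a future notebook.
address_to_entity = {}
staking_df = df.copy()
# Fall back to the raw address when no entity label is known
staking_df['entity'] = staking_df['address'].map(address_to_entity).fillna(staking_df['address'])
entity_df = staking_df.groupby('entity', as_index=False)['stake'].sum()
entity_df['percentage_stake'] = entity_df['stake'] / entity_df['stake'].sum()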
We also continue our running analysis of the Beacon Chain through the lens of our 5 metrics. In this notebook, we take a look at epochs 39121 - 42211 (May 24th, 8:54AM GMT to June 7th, 2:30AM GMT). As always, we start off by collecting and processing the data.
files = ["attestor_slashing", "proposer_slashing", "block_count", "participation_rate", "exit_count", "deposits"]
dfs = []
for file in files:
df = pd.read_csv(f"{file}.csv", header=None, names=["epoch", file])
df.dropna(subset=["epoch"], inplace=True)
dfs += [df[[file]]] # We don't want the epoch column
df = pd.concat([df[["epoch"]]] + dfs, axis=1) # Concat everything, with the epoch column first
df["participation_rate"] *= 100 # Set to percentages
df = df[df.epoch < max(df["epoch"])] # Remove last epoch (queried too soon)
df["epoch"] = df["epoch"].astype(int)
rng = np.random.default_rng(42)
df['temp'] = rng.uniform(0, 10, len(df["epoch"]))
fig = px.scatter(
df[df.attestor_slashing > 0], x = 'epoch', y = 'temp', size = 'attestor_slashing',
size_max = 20, width = 800, height = 400, labels = {"epoch": "Epoch"})
fig.update_xaxes(range=(min(df["epoch"]), max(df["epoch"])))
fig.update_yaxes(visible=False)
fig = px.scatter(
df[df.proposer_slashing > 0], x = 'epoch', y = 'temp', size = 'proposer_slashing',
size_max = 20, width = 800, height = 400, labels = {"epoch": "Epoch"})
fig.update_xaxes(range=(min(df["epoch"]), max(df["epoch"])))
fig.update_yaxes(visible=False)
Thus, we see that there were 3 attester slashing events, which occurred at epochs 41335, 41342 and 42135, with one attester slashed in each event.
There were no proposer slashing events in this range of epochs.
bucket_size = 200
df["bucket"] = np.floor_divide(df["epoch"], bucket_size)
df["n_bxs"] = 1
df_bucket = df[["bucket", "block_count", "n_bxs"]].groupby(["bucket", "block_count"]).sum("n_bxs").reset_index()
df_bucket["epoch"] = df_bucket.bucket.apply(
lambda bucket: f"{max(min(df['epoch']), bucket * bucket_size)}-{min(max(df['epoch']), (bucket + 1) * bucket_size)}"
)
fig = px.scatter(df_bucket, x = 'epoch', y = 'block_count', size = 'n_bxs',
width=600, height=400, labels={ "block_count": "Blocks produced", "epoch": "Epoch", "n_bxs": "Count" },
title = f"Block count in intervals of {bucket_size} epochs")
fig
# fig.update_layout(xaxis=dict(
# tickmode = 'array',
# tickvals = df_bucket['epoch'],
# ticktext = [str(int(s)) for s in df_bucket['epoch']]
# ))
block_freq = df[['block_count']].value_counts(normalize=True).rename_axis('block_count').reset_index(name='freq')
block_freq["freq"] *= 100
px.bar(
block_freq, x="block_count", y="freq", labels={"block_count": "Blocks per epoch", "freq": "Frequency (%)"},
width=600, height=400
)
As we see from the plot and the statistics above, the number of proposed blocks in most epochs continues to be 32, which shows that overall the network is performing well. However, this time the frequency with which the number of proposed blocks dropped to 29-30 is higher, and there was even one epoch in which only 27 blocks were proposed.
The network also seems to have performed "worse" between epochs 39500 and 39900 and between epochs 41100 and 41500, and "better" between epochs 40300 and 40700.
bins = pd.IntervalIndex.from_tuples([(i,i+1) for i in range(int(min(df["participation_rate"])), 100)][::-1])
df["participation_bin"] = pd.cut(df["participation_rate"], bins)
df
df_bucket = df[["bucket", "participation_bin", "n_bxs"]].groupby(["bucket", "participation_bin"]).sum("n_bxs").reset_index()
epoch_names = df_bucket.bucket.apply(
lambda bucket: f"{max(min(df['epoch']), bucket * bucket_size)}-{min(max(df['epoch']), (bucket + 1) * bucket_size)}"
)
df_bucket["epoch"] = epoch_names
df_bucket = df_bucket[["participation_bin", "n_bxs", "epoch"]].pivot(index="participation_bin", columns=["epoch"])
px.imshow(
df_bucket.to_numpy(),
labels=dict(x="Epochs", y="Participation rate", color="Frequency"),
x = sorted(list(set(epoch_names))),
y = [str(s) for s in np.flip(np.arange(int(min(df["participation_rate"])), 100))],
color_continuous_scale='blues'
)
mean = df['participation_rate'].mean()
std = df['participation_rate'].std()
mini = min(df['participation_rate'])
median = df['participation_rate'].quantile(0.5)
maxi = max(df['participation_rate'])
print(" participation statistics")
print("-----------------------------------------------")
print("mean: {}".format(mean))
print("standard devidation: {}".format(std))
print("")
print("minimum: {}".format(mini))
print("median: {}".format(median))
print("maximum: {}".format(maxi))
          participation statistics
-----------------------------------------------
mean: 99.0554344742395
standard deviation: 0.823213998659587

minimum: 93.9082325
median: 99.3405521
maximum: 99.7540593
The above statistics are, as last time, signs of a healthy network!
At around epoch 40800, the participation rate dipped and then gradually climbed back up, peaking towards the end of the period!
The lowest participation rate for this range of epochs was around 94% and was recorded at epoch 41446. For most epochs however, the participation rate was >99%.
px.line(x=df['epoch'], y=df['exit_count'], labels = {"x": "Epoch", "y": "Number of exits"}, title = "Number of voluntary exits")
Thus, we see that there have been no exits among validators in this range of epochs.
fig = px.scatter(
df[df.deposits > 0], x = 'epoch', y = 'temp', size = 'deposits',
size_max = 20, width = 800, height = 400, labels = {"epoch": "Epoch"})
fig.update_yaxes(visible=False)
The trend of having a handful of discrete epochs during which multiple validators were activated at once holds for this range of epochs as well.
In general, the number of validators activated during the first half of this period is significantly higher than during the second half.
As seen in the previous section, the fact that 163400 validators were activated by just 28934 distinct wallet addresses is strong evidence in favour of the hypothesis presented in the last notebook: that most of these large deposits were made by the same entity. But this cannot be confirmed without looking deeper into the data.