In this issue of the Beacon Digest, we start off by exploring the dynamics of one of the largest staking protocols operating on PoS Ethereum - Lido. Specifically, we explore the Lido stETH contract to dive deeper into the mechanisms behind staking deposits in the Lido protocol.
We begin by presenting our motivations for diving deeper into this data and our adopted methodology. We then present our findings and move on to the recurring portion of our biweekly notebooks - assessing the health of the network.
The Lido stETH token is an ERC20 token pegged 1:1 to the ETH deposited by users in the Lido protocol. It represents users' initial deposits as well as all the staking rewards they earn.
The ERC20 contract used to mint these tokens can be found on Etherscan here. We felt that analyzing the smart contract and breaking it down was a good first step.
Internal transactions, as shown on Etherscan, essentially capture the interactions between different smart contracts. They are triggered by parent transactions included in blocks.
The above image (credits to Blocknative) details three internal transactions triggered by one transaction.
Thus, diving deeper into the internal transactions of the stETH token contract should provide us with novel insights into how different protocols and services interact with Lido.
At first glance, we can say that roughly two types of internal transactions were captured by the stETH token contract - the first where some amount of ETH was deposited to the contract, and the second where deposits of 32 ETH were made to the official Ethereum Proof-of-Stake (PoS) deposit contract.
We collected the data pertaining to the internal transactions using the CSV files uploaded on Etherscan. Since we decided to use the web3 library for our analysis, we also needed to establish an active connection with an Ethereum node hosted on Infura, as shown in the next few lines of code.
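As an aside, internal transactions are not exposed by the standard JSON-RPC interface; one way to pull them programmatically is Etherscan's txlistinternal API endpoint. The sketch below illustrates this alternative to the CSV export route we took, with ETHERSCAN_API_KEY standing in as a hypothetical placeholder for a real API key.
# Hedged sketch: fetching the stETH contract's internal transactions through
# Etherscan's API instead of the CSV exports used below.
import requests
params = {
    "module": "account",
    "action": "txlistinternal",
    "address": "0xae7ab96520de3a18e5e111b5eaab095312d7fe84",  # Lido stETH contract
    "startblock": 0,
    "endblock": 99999999,
    "sort": "asc",
    "apikey": ETHERSCAN_API_KEY,  # hypothetical placeholder
}
resp = requests.get("https://api.etherscan.io/api", params=params)
internal_txs = resp.json()["result"]  # one dict per internal transaction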
# Standard-library imports
import csv
import json
import math
from datetime import datetime
from time import *

# Third-party imports
import requests
import numpy as np
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt
import plotly.express as px
import plotly.io as pio
import plotly.graph_objects as go
from web3 import Web3

# Use plotly as the pandas plotting backend and set the notebook renderer
pd.options.plotting.backend = "plotly"
pio.renderers.default = "plotly_mimetype+notebook_connected"
with open('infura_url.txt', 'r') as file:
    infura_url = file.read()
web3 = Web3(Web3.HTTPProvider(infura_url))
web3.isConnected()
True
contract_address = web3.toChecksumAddress('0xae7ab96520de3a18e5e111b5eaab095312d7fe84')
abi = json.loads('[{"constant":true,"inputs":[],"name":"proxyType","outputs":[{"name":"proxyTypeId","type":"uint256"}],"payable":false,"stateMutability":"pure","type":"function"},{"constant":true,"inputs":[],"name":"isDepositable","outputs":[{"name":"","type":"bool"}],"payable":false,"stateMutability":"view","type":"function"},{"constant":true,"inputs":[],"name":"implementation","outputs":[{"name":"","type":"address"}],"payable":false,"stateMutability":"view","type":"function"},{"constant":true,"inputs":[],"name":"appId","outputs":[{"name":"","type":"bytes32"}],"payable":false,"stateMutability":"view","type":"function"},{"constant":true,"inputs":[],"name":"kernel","outputs":[{"name":"","type":"address"}],"payable":false,"stateMutability":"view","type":"function"},{"inputs":[{"name":"_kernel","type":"address"},{"name":"_appId","type":"bytes32"},{"name":"_initializePayload","type":"bytes"}],"payable":false,"stateMutability":"nonpayable","type":"constructor"},{"payable":true,"stateMutability":"payable","type":"fallback"},{"anonymous":false,"inputs":[{"indexed":false,"name":"sender","type":"address"},{"indexed":false,"name":"value","type":"uint256"}],"name":"ProxyDeposit","type":"event"}]')
# Internal-transaction CSV exports downloaded from Etherscan
df1 = pd.read_csv('import_file_1.csv', index_col=False, low_memory=False)
df2 = pd.read_csv('import_file_2.csv', index_col=False, low_memory=False)
frames = [df1, df2]
df = pd.concat(frames)
We notice that a single transaction often makes multiple deposits of 32 ETH to the PoS deposit contract, so we decided to prune the dataframe of internal transactions and remove all entries sharing the same transaction hash.
df_pruned = df.drop_duplicates(subset = 'Txhash', keep = 'first')
print(len(df_pruned))
1856
As we see, there are 1856 unique transactions that we have to analyze.
deposit_transactions = df_pruned['TxTo'] == '0x00000000219ab540356cbb839cbe05303d7705fa'
stEth_token_transactions = df_pruned['TxTo'] == '0xae7ab96520de3a18e5e111b5eaab095312d7fe84'
df_pruned_deposit_transactions = df_pruned[deposit_transactions]
df_pruned_stEth_token_transactions = df_pruned[stEth_token_transactions]
zero_value_transactions = df_pruned_stEth_token_transactions['Value_IN(ETH)'] == 0
df_pruned_zero_value_transactions = df_pruned_stEth_token_transactions[zero_value_transactions]
print(len(df_pruned_deposit_transactions))
print(len(df_pruned_stEth_token_transactions))
#print(len(df_pruned_zero_value_transactions))
195
1661
Out of these 1856 transactions, there are 195 deposit transactions.
Note here that we analyze the pruned dataset, meaning that in reality there are many more than 195 deposits of 32 ETH made to the PoS deposit contract, since in many cases a single transaction triggers multiple deposits, activating multiple validators.
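As a sanity check, we can count every 32 ETH deposit row in the raw (unpruned) dataframe; a minimal sketch, assuming the same TxTo column as above:
# Sketch: number of individual deposit rows before de-duplication, i.e. a
# rough count of the validator deposits actually triggered.
all_deposit_rows = df[df['TxTo'] == '0x00000000219ab540356cbb839cbe05303d7705fa']
print(len(all_deposit_rows))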
df_pruned_deposit_transactions.to_csv('lido_deposits.csv', index = False)
df_pruned_stEth_token_transactions.to_csv('lido_stEth_token_transactions.csv', index = False)
txn_hash_deposit_transactions = df_pruned_deposit_transactions.iloc[:, 0]  # first column holds the Txhash
data_list_eth2_deposits = []
txn_hash_stEth_token_transactions = df_pruned_stEth_token_transactions.iloc[:, 0]  # first column holds the Txhash
data_list_stEth_token_transactions = []
To collect additional data on each parent transaction, we used the web3.py library's get_transaction method.
for i in txn_hash_deposit_transactions:
    data_list_eth2_deposits.append(web3.eth.get_transaction(i))
for i in txn_hash_stEth_token_transactions:
    data_list_stEth_token_transactions.append(web3.eth.get_transaction(i))
df_gas_deposits = pd.DataFrame(data_list_eth2_deposits)
df_gas_stEth_token_transactions = pd.DataFrame(data_list_stEth_token_transactions)
df_gas_deposits.to_csv('lido_deposits_with_gas.csv', index = False)
df_gas_stEth_token_transactions.to_csv('lido_stEth_token_transactions_with_gas.csv', index = False)
Once the final dataframe was ready to work with, the next step was to gain some novel insights into the process flow leading to deposit transactions made through the Lido protocol by examining the unique 'From' and 'To' address pairs for these transactions.
This gives us an idea of who triggers these deposits and helps demystify the architecture set in place for making them.
df_deposit_transactions_pairs = df_pruned_deposit_transactions.groupby(['ParentTxFrom','ParentTxTo', 'TxTo', 'From']).size().reset_index().rename(columns={0:'count'})
df_deposit_transactions_pairs.sort_values(["count"], ascending=False)
| | ParentTxFrom | ParentTxTo | TxTo | From | count |
|---|---|---|---|---|---|
| 2 | 0x6352f8c749954c9df198cf72976e48994a77cce2 | 0x1ee5c83c4b43aaed21613d5cc7835d36078ce03f | 0x00000000219ab540356cbb839cbe05303d7705fa | 0xae7ab96520de3a18e5e111b5eaab095312d7fe84 | 72 |
| 5 | 0xa76a7d0d06754e4fc4941519d1f9d56fd9f8d53b | 0xae7ab96520de3a18e5e111b5eaab095312d7fe84 | 0x00000000219ab540356cbb839cbe05303d7705fa | 0xae7ab96520de3a18e5e111b5eaab095312d7fe84 | 53 |
| 0 | 0x00444797ba158a7bdb8302e72da98dcbccef0fbc | 0xae7ab96520de3a18e5e111b5eaab095312d7fe84 | 0x00000000219ab540356cbb839cbe05303d7705fa | 0xae7ab96520de3a18e5e111b5eaab095312d7fe84 | 36 |
| 1 | 0x073adf97f6de257d76e67f7c2fe57ac9843cca25 | 0xae7ab96520de3a18e5e111b5eaab095312d7fe84 | 0x00000000219ab540356cbb839cbe05303d7705fa | 0xae7ab96520de3a18e5e111b5eaab095312d7fe84 | 25 |
| 6 | 0xc8381ca290c198f5ab739a1841ce8aedb0b330d5 | 0xae7ab96520de3a18e5e111b5eaab095312d7fe84 | 0x00000000219ab540356cbb839cbe05303d7705fa | 0xae7ab96520de3a18e5e111b5eaab095312d7fe84 | 5 |
| 3 | 0x6e34e47df7026e0ace9457f930f1cfada6f547c4 | 0x1ee5c83c4b43aaed21613d5cc7835d36078ce03f | 0x00000000219ab540356cbb839cbe05303d7705fa | 0xae7ab96520de3a18e5e111b5eaab095312d7fe84 | 3 |
| 4 | 0x99b2c5d50086b02f83e791633c5660fbb8344653 | 0x1ee5c83c4b43aaed21613d5cc7835d36078ce03f | 0x00000000219ab540356cbb839cbe05303d7705fa | 0xae7ab96520de3a18e5e111b5eaab095312d7fe84 | 1 |
Based on our findings from the previous section, we were able to hypothesize a rough architecture diagram of how deposits work with Lido.
Taking a look at the results of our analysis, we can see that there exist 7 unique 'From' and 'To' address pairs which, when they transact, trigger a deposit of 32 ETH to the PoS deposit contract.
What is interesting here is that there are 2 distinct 'ParentTxTo' addresses - the first being the stETH token contract, and the other a contract that goes by the name 'Vyper_contract'.
On reading the contract documentation, we identify that the method of interest to us is depositBufferedEther(), which, when called, makes a deposit of 32 ETH to the PoS deposit contract. The ETH deposited is the ETH that is temporarily buffered in the contract.
Thus, through this first channel we have 4 "depositors" (possibly Lido employees) with distinct wallet addresses invoking the depositBufferedEther() method by sending a transaction of 0 ETH to the stETH token contract.
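To make this concrete, here is a minimal, hedged sketch of how such a 0 ETH transaction could be constructed with web3.py. The single-function ABI fragment is hand-written for illustration (the full ABI and exact signature should be checked on Etherscan), and depositor_address is a hypothetical placeholder for one of the four depositor wallets.
# Sketch only - not the exact Lido flow.
deposit_abi = json.loads(
    '[{"constant":false,"inputs":[],"name":"depositBufferedEther","outputs":[],'
    '"payable":false,"stateMutability":"nonpayable","type":"function"}]'
)
lido = web3.eth.contract(address=contract_address, abi=deposit_abi)
tx = lido.functions.depositBufferedEther().buildTransaction({
    "from": depositor_address,  # hypothetical depositor wallet
    "value": 0,  # the transaction carries 0 ETH; the contract spends its buffered ETH
    "nonce": web3.eth.get_transaction_count(depositor_address),
})
# The depositor would then sign tx with their key and broadcast it.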
What is very interesting about the 'Vyper_contract' is the fact that it has a reference to KeeperDAO. A transaction to this contract also triggers a deposit through the same depositBufferedEther() function, since it holds a reference to the stETH contract.
The contract uses an assertion with the isKeeper(address keeper) → bool method to ensure that the sender of the message is a keeper (a participant who executes available jobs in exchange for a reward in the Keep3r network).
Thus, the way this is set up, a keeper can directly use their ETH to activate new validators on the Beacon Chain rather than going through the regular endpoint that "normal" users would have to go through.
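For illustration, the keeper check could be replicated off-chain with a read-only call; a hedged sketch, where the ABI fragment is hand-written from the signature quoted above and keeperdao_address / candidate_address are hypothetical placeholders:
# Sketch: query isKeeper() as a view call before attempting a deposit.
is_keeper_abi = json.loads(
    '[{"constant":true,"inputs":[{"name":"keeper","type":"address"}],'
    '"name":"isKeeper","outputs":[{"name":"","type":"bool"}],'
    '"payable":false,"stateMutability":"view","type":"function"}]'
)
keeper_pool = web3.eth.contract(address=keeperdao_address, abi=is_keeper_abi)
print(keeper_pool.functions.isKeeper(candidate_address).call())  # True for registered keepers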
In addition to the above analysis, we also take a closer look at the gas fees that were spent on making these deposits.
High transaction fees are an indicator of a busier network, with more people making transactions such as DEX trades or asset deposits.
df_lido_deposits_with_gas = pd.read_csv("lido_deposits_with_gas.csv")
df_gas = pd.read_csv("gas_fee_data.csv")

y = df_lido_deposits_with_gas["gasPrice"]     # gas price of each Lido deposit transaction, in Wei
y1 = df_gas["Value (Wei)"]                    # network-average gas price, in Wei
x = df_lido_deposits_with_gas["blockNumber"]

lst = []   # Lido gas prices converted to ETH
lst1 = []  # network-average gas prices converted to ETH
lst2 = []  # timestamps of the blocks containing the Lido deposits

for t in x:
    temp = web3.eth.get_block(t)['timestamp']
    lst2.append(datetime.fromtimestamp(temp))
for i in y:
    lst.append(Web3.fromWei(int(i), 'ether'))
for j in y1:
    lst1.append(Web3.fromWei(j, 'ether'))

fig = px.scatter(x = lst2, y = lst, title = "Gas prices of Lido deposit transactions")
fig.update_layout(xaxis_title = "Date", yaxis_title = "Gas Price (Eth)")
fig.show()

fig1 = px.scatter(x = df_gas["Date(UTC)"], y = lst1, title = "Average gas prices for that period of time")
fig1.update_layout(xaxis_title = "Date(UTC)", yaxis_title = "Gas Price (Eth)")
fig1.show()
Through the above graph we thus get more insight into roughly how much Lido spent on gas fees for these deposits and how those fees were distributed over time.
The trend we notice is that the transaction fees peaked soon after Lido first started activating validators. The gas fees during this period were quite high for the entire network, as we see in the second graph plotted from data downloaded off Etherscan.
We also notice that during this period (around May 10th - 15th) Lido paid significantly higher gas fees than the average (in some cases - May 11th, for instance - the difference was almost 100 gwei) to get their transactions included on chain.
However, the transaction fees gradually decreased to values far lower than that peak.
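To put a rough number on that premium, the per-transaction gas prices can be aggregated by day; a minimal sketch reusing the lst (prices in ETH) and lst2 (block dates) series built above:
# Sketch: daily maximum gas price Lido paid for deposit transactions.
df_cmp = pd.DataFrame({"date": [d.date() for d in lst2], "gas_price_eth": lst})
daily_max = df_cmp.groupby("date")["gas_price_eth"].max()
print(daily_max.sort_values(ascending=False).head(10))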
Once again we continue our running analysis of the Beacon Chain through the lens of our 6 metrics. In this notebook, we take a look at epochs 45331 - 48480 (June 21, 7:18 AM GMT+8 to July 5, 7:12 AM GMT+8). As always, we start off by collecting and processing the data.
files = ["attestor_slashing", "proposer_slashing", "block_count", "participation_rate", "exit_count", "deposits"]
dfs = []
for file in files:
    df = pd.read_csv(f"{file}.csv", header=None, names=["epoch", file])
    df.dropna(subset=["epoch"], inplace=True)
    dfs += [df[[file]]]  # We don't want the epoch column
df = pd.concat([df[["epoch"]]] + dfs, axis=1)  # Concat everything, with the epoch column first
df["participation_rate"] *= 100  # Set to percentages
df = df[df.epoch < max(df["epoch"])]  # Remove last epoch (queried too soon)
df["epoch"] = df["epoch"].astype(int)
# Random y-values to spread the slashing markers vertically on the scatter plot
rng = np.random.default_rng(42)
df['temp'] = rng.uniform(0, 10, len(df["epoch"]))
fig = px.scatter(
    df[df.attestor_slashing > 0], x = 'epoch', y = 'temp', size = 'attestor_slashing',
    size_max = 20, labels = {"epoch": "Epoch"},
    title = "Attester slashings"
)
fig.update_xaxes(range=(min(df["epoch"]), max(df["epoch"])))
fig.update_yaxes(visible=False)
fig = px.scatter(
    df[df.proposer_slashing > 0], x = 'epoch', y = 'temp', size = 'proposer_slashing',
    size_max = 20, labels = {"epoch": "Epoch"},
    title = "Proposer slashings"
)
fig.update_xaxes(range=(min(df["epoch"]), max(df["epoch"])))
fig.update_yaxes(visible=False)
Thus, we see that there have been zero attester slashing events and one proposer slashing event (the first ever since the inception of The Beacon Digest), at epoch 47196, where one proposer was slashed.
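As a quick verification, the slashing epochs can be read straight off the dataframe:
# Sketch: list every epoch in which a slashing was recorded.
print(df[df.attestor_slashing > 0]["epoch"].tolist())   # expected: []
print(df[df.proposer_slashing > 0]["epoch"].tolist())   # expected: [47196]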
bucket_size = 200
df["bucket"] = np.floor_divide(df["epoch"], bucket_size)
df["n_bxs"] = 1
df_bucket = df[["bucket", "block_count", "n_bxs"]].groupby(["bucket", "block_count"]).sum("n_bxs").reset_index()
df_bucket["epoch"] = df_bucket.bucket.apply(
    lambda bucket: f"{max(min(df['epoch']), bucket * bucket_size)}-{min(max(df['epoch']), (bucket + 1) * bucket_size)}"
)
fig = px.scatter(df_bucket, x = 'epoch', y = 'block_count', size = 'n_bxs',
                 labels={ "block_count": "Blocks produced", "epoch": "Epoch", "n_bxs": "Count" },
                 title = f"Block count in intervals of {bucket_size} epochs")
fig
block_freq = df[['block_count']].value_counts(normalize=True).rename_axis('block_count').reset_index(name='freq')
block_freq["freq"] *= 100
px.bar(
    block_freq, x="block_count", y="freq", labels={"block_count": "Blocks per epoch", "freq": "Frequency (%)"}
)
We once again see that the network has been performing very well with regard to this metric, and everything seems to be right on track.
Around 82.6% of the time, 32 blocks were proposed per epoch; around 15.7% of the time this number was 31; and around 1.6% of the time it was below 31.
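These percentages can be read back out of block_freq directly; a one-line sketch:
# Sketch: frequency (%) of each blocks-per-epoch count, highest counts first.
print(block_freq.sort_values("block_count", ascending=False).round(1))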
bins = pd.IntervalIndex.from_tuples([(i,i+1) for i in range(int(min(df["participation_rate"])), 100)][::-1])
df["participation_bin"] = pd.cut(df["participation_rate"], bins)
df_bucket = df[["bucket", "participation_bin", "n_bxs"]].groupby(["bucket", "participation_bin"]).sum("n_bxs").reset_index()
epoch_names = df_bucket.bucket.apply(
    lambda bucket: f"{max(min(df['epoch']), bucket * bucket_size)}-{min(max(df['epoch']), (bucket + 1) * bucket_size)}"
)
df_bucket["epoch"] = epoch_names
df_bucket = df_bucket[["participation_bin", "n_bxs", "epoch"]].pivot(index="participation_bin", columns=["epoch"])
px.imshow(
    df_bucket.to_numpy(),
    labels=dict(x="Epochs", y="Participation rate", color="Frequency"),
    x = sorted(list(set(epoch_names))),
    y = [str(s) for s in np.flip(np.arange(int(min(df["participation_rate"])), 100))],
    color_continuous_scale='blues'
)
mean = df['participation_rate'].mean()
std = df['participation_rate'].std()
mini = min(df['participation_rate'])
median = df['participation_rate'].quantile(0.5)
maxi = max(df['participation_rate'])
print(" participation statistics")
print("-----------------------------------------------")
print("mean: {}".format(mean))
print("standard devidation: {}".format(std))
print("")
print("minimum: {}".format(mini))
print("median: {}".format(median))
print("maximum: {}".format(maxi))
 participation statistics
-----------------------------------------------
mean: 99.0559773379996
standard deviation: 0.8162056384388161

minimum: 94.4651424884796
median: 99.37724471092224
maximum: 99.78379607200624
fig = px.histogram(df, x="participation_rate", marginal="rug")
fig.show()
Everything seems to be looking good with the network participation as well!
The participation rate of the network was higher than usual in the epoch range 46355 - 46725 and lower than usual in the epoch range 46388 - 45423, with the lowest participation rate recorded at epoch 48104.
The lowest participation rate for this range of epochs was around 94.46% (significantly higher than the last fortnight's minimum) and the highest was around 99.78%. Once again, most epochs had a participation rate of >99%.
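The quoted extremes can be verified directly from the dataframe; a short sketch:
# Sketch: epochs attaining the minimum and maximum participation rates.
print(df.loc[df["participation_rate"].idxmin(), ["epoch", "participation_rate"]])
print(df.loc[df["participation_rate"].idxmax(), ["epoch", "participation_rate"]])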
px.line(x=df['epoch'], y=df['exit_count'], labels = {"x": "Epoch", "y": "Number of exits"}, title = "Number of voluntary exits")
Thus, we see that once again there have been no exits among validators in this range of epochs.
fig = px.scatter(
    df[df.deposits > 0], x = 'epoch', y = 'temp', size = 'deposits',
    size_max = 20, labels = {"epoch": "Epoch"}
)
fig.update_yaxes(visible=False)
An interesting trend we notice in the deposits made to the Beacon Chain this fortnight is that there were a lot of deposits in the 272 - 512 range concentrated in a small range of epochs (46112 - 46118).
Apart from this small stretch, most of the deposits seem to be somewhat evenly distributed across all the epochs.
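To zoom in on that stretch, the deposit counts in the epoch range in question can be listed directly; a minimal sketch:
# Sketch: inspect the burst of deposits around epochs 46112 - 46118.
burst = df[(df["epoch"] >= 46112) & (df["epoch"] <= 46118) & (df["deposits"] > 0)]
print(burst[["epoch", "deposits"]])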