-
Notifications
You must be signed in to change notification settings - Fork 29
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
post_processing(): rewrite and added new columns as requested in #45
- Loading branch information
1 parent
d72180f
commit f7fe982
Showing
1 changed file
with
82 additions
and
35 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,35 +1,82 @@ | ||
from pandas import DataFrame | ||
from decimal import Decimal | ||
|
||
def append_to_list(dictionary, key, value): | ||
if dictionary.get(key) is None: | ||
dictionary[key] = [] | ||
dictionary[key].append(value) | ||
|
||
|
||
def post_processing(df: DataFrame) -> DataFrame: | ||
sim_dict = {} | ||
for i, row in df.iterrows(): | ||
idx_pool = row['pool'] | ||
for token in idx_pool['tokens']: | ||
append_to_list(sim_dict, f'token_{token.lower()}_balance', Decimal(idx_pool['tokens'][token].balance)) | ||
append_to_list(sim_dict, f'token_{token.lower()}_weight', idx_pool['tokens'][token].weight) | ||
append_to_list(sim_dict, f'token_{token.lower()}_denorm_weight', idx_pool['tokens'][token].denorm_weight) | ||
append_to_list(sim_dict, 'generated_fees', idx_pool['generated_fees']) | ||
append_to_list(sim_dict, 'pool_shares', idx_pool['pool_shares']) | ||
|
||
idx_token_prices = row.get('token_prices') | ||
if idx_token_prices is not None: | ||
for token in idx_token_prices: | ||
append_to_list(sim_dict, f'token_{token.lower()}_price', idx_token_prices[token]) | ||
|
||
idx_spot_prices = row.get('spot_prices') | ||
if idx_spot_prices is not None: | ||
for token in idx_spot_prices: | ||
append_to_list(sim_dict, f'token_{token.lower()}_spot_price', idx_spot_prices[token]) | ||
|
||
rest_keys = list(filter(lambda key: key != 'token_prices' and key != 'pool' and key != 'spot_prices', df.columns)) | ||
for key in rest_keys: | ||
append_to_list(sim_dict, key, row[key]) | ||
processed_df = DataFrame.from_dict(sim_dict) | ||
return processed_df | ||
import pandas as pd | ||
import typing | ||
|
||
def unpack_column_tokens(column_tokens: pd.Series, token_symbols: typing.List[str]) -> pd.DataFrame: | ||
di = {} | ||
for symbol in token_symbols: | ||
di[f'token_{symbol}_balance'] = [] | ||
di[f'token_{symbol}_denorm_weight'] = [] | ||
di[f'token_{symbol}_weight'] = [] | ||
for r in column_tokens: | ||
di[f'token_{symbol}_weight'].append(r[symbol.upper()].weight) | ||
di[f'token_{symbol}_denorm_weight'].append(r[symbol.upper()].denorm_weight) | ||
di[f'token_{symbol}_balance'].append(r[symbol.upper()].balance) | ||
return pd.DataFrame.from_dict(di) | ||
|
||
def unpack_column_pool(df: pd.DataFrame) -> pd.DataFrame: | ||
column_pool = pd.DataFrame.from_records(df["pool"].to_list()) | ||
token_symbols = assets_in_df(df) | ||
column_tokens = column_pool["tokens"] | ||
column_tokens_unpacked = unpack_column_tokens(column_tokens, token_symbols) | ||
return column_pool.assign(**column_tokens_unpacked).drop("tokens", axis=1) | ||
|
||
def unpack_column_token_prices(df: pd.DataFrame) -> pd.DataFrame: | ||
column_token_prices = df["token_prices"] | ||
token_symbols = assets_in_df(df) | ||
di = {} | ||
for symbol in token_symbols: | ||
di[f'token_{symbol}_price'] = [] | ||
for r in column_token_prices: | ||
di[f'token_{symbol}_price'].append(r[symbol.upper()]) | ||
return pd.DataFrame.from_dict(di) | ||
|
||
# At this point I should generalize the "unpacking" pattern, but then it'd be even harder to follow once I've forgotten everything | ||
def unpack_column_spot_prices(df: pd.DataFrame) -> pd.DataFrame: | ||
column_spot_prices = df.spot_prices | ||
# Can't assets_in_df() here because this column might not include spot_prices for all assets in df (why?) | ||
token_symbols = list(column_spot_prices[0].keys()) | ||
token_symbols.sort() | ||
di = {} | ||
for symbol in token_symbols: | ||
symbol_low = symbol.lower() | ||
di[f'token_{symbol_low}_spot_price'] = [] | ||
for r in column_spot_prices: | ||
di[f'token_{symbol_low}_spot_price'].append(r[symbol]) | ||
return pd.DataFrame.from_dict(di) | ||
|
||
def assets_in_df(df: pd.DataFrame) -> typing.List[str]: | ||
assets = list(df.pool[0]["tokens"].keys()) | ||
assets.sort() | ||
assets = [a.lower() for a in assets] | ||
return assets | ||
|
||
def calc_token_x_value(df: pd.DataFrame) -> pd.DataFrame: | ||
symbols = assets_in_df(df) | ||
di = {} | ||
for s in symbols: | ||
di[f'token_{s}_value'] = df[f'token_{s}_balance'].astype(float) * df[f'token_{s}_price'] | ||
return pd.DataFrame.from_dict(di) | ||
|
||
def post_processing(df: pd.DataFrame) -> pd.DataFrame: | ||
unpacked_column_pool = unpack_column_pool(df) | ||
unpacked_column_token_prices = unpack_column_token_prices(df) | ||
unpacked_column_spot_prices = unpack_column_spot_prices(df) | ||
|
||
df = df.assign(**unpacked_column_pool).assign(**unpacked_column_token_prices).assign(**unpacked_column_spot_prices) | ||
|
||
# Calculate token_{x}_value columns | ||
token_x_value = calc_token_x_value(df) | ||
df = df.assign(**token_x_value) | ||
|
||
# Calculate TVL column | ||
symbols = assets_in_df(df) | ||
token_value_columns = [f'token_{s}_value' for s in symbols] | ||
column_tvl = df[token_value_columns].sum(axis=1) | ||
df = df.assign(tvl=column_tvl) | ||
|
||
# Calculate total_token_balances | ||
token_balance_columns = [f'token_{s}_balance' for s in symbols] | ||
column_total_token_balances = df[token_balance_columns].sum(axis=1) | ||
df = df.assign(total_token_balances=column_total_token_balances) | ||
|
||
return df |