In [1]:
import pandas as pd
import numpy as np
import re
def format_bigquery_column_names(nftfi):
    # Remove special charachters
    nftfi.columns = [re.sub(r'[^a-zA-Z0-9\s]+', '', column) for column in nftfi.columns]
    # Remove spaces at beginning and end
    nftfi.columns = nftfi.columns.str.strip()
    # Replace spaces with underscore
    nftfi.columns = nftfi.columns.str.replace(' ', '_')
    # Define a function to convert camel-case to kebab-case
    def camel_to_kebab(s):
        # Replace consecutive capital letters with a single lowercase letter
        s = re.sub(r'(?<=[a-z])(?=[A-Z])', '_', s)
        # Convert remaining camel-case string to kebab-case
        s = re.sub(r'(?<!^)(?<!_)(?=[A-Z])(?![A-Z])', '_', s).lower()
        return s
    # Apply the function to all column names
    nftfi.columns = nftfi.columns.map(camel_to_kebab)
    return nftfi



## Load tables

In [2]:
try: 
    mq = pd.read_csv('mq.csv')
except FileNotFoundError:
    mq = pd.read_csv('analysis/mq.csv')
nftfi = pd.read_csv('../analytics_bot_langchain/data/nftfi/loans_with_transaction_hash.csv')
nftfi = format_bigquery_column_names(nftfi)
nftfi = nftfi.rename(columns={'loan_id': 'loan_no', 'loan_date': 'date'})


In [3]:
pd.set_option('display.max_rows', 500)
pd.set_option('display.max_columns', 500)


In [4]:
print('MQ')
display(mq.head(2))
print('\n--------------------------------------------------------------------')
print('\n\nNFTfi')
display(nftfi.head(2))

MQ


Unnamed: 0,transaction_hash,block_timestamp,loan_id,to_address,from_address,principal_amount,repayment_amount,erc20_address,erc20_name,due_date,duration_in_days,apr,token_id,collection_address,protocol,amt_in_usd,roll_over,block_number,p2p_p2pool
0,0x933ff7d3b9d60593c97a5c9ab28205e54f019259defd...,2022-02-26 09:26:37.000000 UTC,-4882,0x676f3d2c9f5776e09d23986adc6684fb41e9000e,0x0aff497bd016000185b1c8302fa98a88ff4a4178,0.8,0.826624,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-03-28 09:26:37.000000 UTC,30.0,0.405,1378,0x026224a2940bfe258d0dbe947919b62fe321f042,nftfi,2205.66016,False,14280871,p2p
1,0xd1b9fbddbcaaaea8fa8b19cfa53c5e9093993f0d51c0...,2022-04-19 22:33:16.000000 UTC,733,0x676f3d2c9f5776e09d23986adc6684fb41e9000e,0x2c35b3d207f745ad5b17d88328286c49a0ce4d4f,1.4,1.413425,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-04-26 22:33:16.000000 UTC,7.0,0.500013,1378,0x026224a2940bfe258d0dbe947919b62fe321f042,nftfi,4339.42642,False,14618284,p2p



--------------------------------------------------------------------


NFTfi


Unnamed: 0,loan_no,id,loan_contract,status,borrower,lender,loan_principal_amount,maximum_repayment_amount,loan_duration_d,loan_apr,loan_start_time,date,loan_erc20denomination,block_num,transaction_hash,gas_price,gas_limit,gas_used,cumulative_gas_used,effective_gas_price,repaid,liquidated,loan_repaid_time,repaid_amount_paid_to_lender,repaid_transaction_hash,repaid_gas_price,repaid_gas_limit,repaid_gas_used,repaid_cumulative_gas_used,repaid_effective_gas_price,repaid_admin_fee,loan_liquidation_date,liquidated_transaction_hash,liquidated_gas_price,liquidated_gas_limit,liquidated_gas_used,liquidated_cumulative_gas_used,liquidated_effective_gas_price
0,v1.loan.fixed-0,0,v1.loan.fixed,repaid,0xc35A5FEc6BE6957899E15559Be252Db882220b37,0x44DdF3e35Cd2D629d78674FF6BF5b953e2B069fe,30000000000000000,35000000000000000,7,869.047619,1589580384,2020-05-15T22:06:24.000Z,0xC02aaA39b223FE8D0A0e5C4F27eAD9083C756Cc2,10073259,0x7c7675a6613ddaded0b187314c2edd3ad3c5428a7a14...,17782723583,1000000,436882,3212704,17782723583,1.0,,2020-05-16T09:25:02.000Z,34750000000000000,0x3e24b9cd4c0208acc25259d4fcbddf75b48a554d6814...,19000000000.0,500000.0,120497.0,9549420.0,19000000000.0,250000000000000,,,,,,,
1,v1.loan.fixed-1,1,v1.loan.fixed,repaid,0xc35A5FEc6BE6957899E15559Be252Db882220b37,0x44DdF3e35Cd2D629d78674FF6BF5b953e2B069fe,3000000000000000,3100000000000000,7,173.809524,1589623507,2020-05-16T10:05:07.000Z,0xC02aaA39b223FE8D0A0e5C4F27eAD9083C756Cc2,10076484,0x937a5320404c0c835f2739c84b229ef837a9f0b0ef92...,19755020080,500000,441106,9710213,19755020080,1.0,,2020-05-16T11:50:26.000Z,3095000000000000,0x59d1c26160b7bdde716b380364b506e056d852ac1b36...,16974490000.0,500000.0,122603.0,9470068.0,16974490000.0,5000000000000,,,,,,,


In [5]:
mq['loan_id'].head(2)

0   -4882
1     733
Name: loan_id, dtype: int64

### Clean data

In [6]:
# clean loan IDs to try and compare them
mq['loan_id_cleaned'] = mq['loan_id'].astype(str).str.replace('-','')
nftfi['loan_no_cleaned'] = nftfi['loan_no'].str.split('-').apply(lambda x: x[-1])
nftfi

Unnamed: 0,loan_no,id,loan_contract,status,borrower,lender,loan_principal_amount,maximum_repayment_amount,loan_duration_d,loan_apr,loan_start_time,date,loan_erc20denomination,block_num,transaction_hash,gas_price,gas_limit,gas_used,cumulative_gas_used,effective_gas_price,repaid,liquidated,loan_repaid_time,repaid_amount_paid_to_lender,repaid_transaction_hash,repaid_gas_price,repaid_gas_limit,repaid_gas_used,repaid_cumulative_gas_used,repaid_effective_gas_price,repaid_admin_fee,loan_liquidation_date,liquidated_transaction_hash,liquidated_gas_price,liquidated_gas_limit,liquidated_gas_used,liquidated_cumulative_gas_used,liquidated_effective_gas_price,loan_no_cleaned
0,v1.loan.fixed-0,0,v1.loan.fixed,repaid,0xc35A5FEc6BE6957899E15559Be252Db882220b37,0x44DdF3e35Cd2D629d78674FF6BF5b953e2B069fe,30000000000000000,35000000000000000,7,869.047619,1589580384,2020-05-15T22:06:24.000Z,0xC02aaA39b223FE8D0A0e5C4F27eAD9083C756Cc2,10073259,0x7c7675a6613ddaded0b187314c2edd3ad3c5428a7a14...,17782723583,1000000,436882,3212704,17782723583,1.0,,2020-05-16T09:25:02.000Z,34750000000000000,0x3e24b9cd4c0208acc25259d4fcbddf75b48a554d6814...,1.900000e+10,500000.0,120497.0,9549420.0,1.900000e+10,250000000000000,,,,,,,,0
1,v1.loan.fixed-1,1,v1.loan.fixed,repaid,0xc35A5FEc6BE6957899E15559Be252Db882220b37,0x44DdF3e35Cd2D629d78674FF6BF5b953e2B069fe,3000000000000000,3100000000000000,7,173.809524,1589623507,2020-05-16T10:05:07.000Z,0xC02aaA39b223FE8D0A0e5C4F27eAD9083C756Cc2,10076484,0x937a5320404c0c835f2739c84b229ef837a9f0b0ef92...,19755020080,500000,441106,9710213,19755020080,1.0,,2020-05-16T11:50:26.000Z,3095000000000000,0x59d1c26160b7bdde716b380364b506e056d852ac1b36...,1.697449e+10,500000.0,122603.0,9470068.0,1.697449e+10,5000000000000,,,,,,,,1
2,v1.loan.fixed-2,2,v1.loan.fixed,repaid,0x44DdF3e35Cd2D629d78674FF6BF5b953e2B069fe,0xc35A5FEc6BE6957899E15559Be252Db882220b37,30000000000000000,30100000000000000,7,17.380952,1589628655,2020-05-16T11:30:55.000Z,0xC02aaA39b223FE8D0A0e5C4F27eAD9083C756Cc2,10076867,0xf331e9fb8341f1b644e0edfe599a56402836808b2570...,12100000000,500000,403060,9269753,12100000000,1.0,,2020-05-16T12:20:16.000Z,30095000000000000,0xfa036df32071d8b4f301b34aa2893bc0499db7e79bf1...,1.320000e+10,500000.0,132834.0,4140219.0,1.320000e+10,5000000000000,,,,,,,,2
3,v1.loan.fixed-3,3,v1.loan.fixed,repaid,0xc35A5FEc6BE6957899E15559Be252Db882220b37,0x44DdF3e35Cd2D629d78674FF6BF5b953e2B069fe,3000000000000000,3010000000000000,7,17.380952,1589631935,2020-05-16T12:25:35.000Z,0xC02aaA39b223FE8D0A0e5C4F27eAD9083C756Cc2,10077100,0x330e8f56d4f6eb07392d8c23858eda1cada42c550ed9...,15430188679,500000,428215,2708977,15430188679,1.0,,2020-05-16T12:28:51.000Z,3009500000000000,0x8f70de246186ae66da45404c856b9db431b26bfcbe7f...,1.310000e+10,500000.0,122603.0,9570320.0,1.310000e+10,500000000000,,,,,,,,3
4,v1.loan.fixed-4,4,v1.loan.fixed,repaid,0xc35A5FEc6BE6957899E15559Be252Db882220b37,0x44DdF3e35Cd2D629d78674FF6BF5b953e2B069fe,200000000000000000,250000000000000000,7,1303.571429,1589633522,2020-05-16T12:52:02.000Z,0xC02aaA39b223FE8D0A0e5C4F27eAD9083C756Cc2,10077208,0x9bd7a9da5505b3d42152dd5f971378daeb6a0e74a0ef...,14000000000,500000,441098,9403518,14000000000,1.0,,2020-05-16T12:56:27.000Z,247500000000000000,0x0eaead5004befd758f4f4a7c04241098eaa9948192e2...,2.100000e+10,500000.0,132203.0,4175144.0,2.100000e+10,2500000000000000,,,,,,,,4
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
40750,v2-1.loan.fixed-33827,33827,v2-1.loan.fixed,,0x887b86B6B6957F7bbeA88B8CEfD392f39236A88C,0x73A1Bb338613291AC6530870Fe2c5D354BFEC17e,600000000,622191781,30,45.000000,1682367647,2023-04-24T20:20:47.000Z,0xA0b86991c6218b36c1d19D4a2e9Eb0cE3606eB48,17118481,0xfd2ae7f526cc0dd5d154e4a24b7d5531201e1b70fab5...,46000000000,490745,480957,6695289,46000000000,,,,,,,,,,,,,,,,,,,33827
40751,v2.loan.fixed.collection-33811,33811,v2.loan.fixed.collection,,0xeE8Cd54223A93DD9B3B2C4701cb1Be5f6886C366,0x818ec19eBE023b4774799fdB39F0b20aF39571FE,99000000000000000000,99732329000000000000,30,9.000003,1682362607,2023-04-24T18:56:47.000Z,0xC02aaA39b223FE8D0A0e5C4F27eAD9083C756Cc2,17118066,0x1ae59b0a6f064d5877d1cb7daf822fbeb6d861be40f8...,52268898606,499431,484843,10219934,52268898606,,,,,,,,,,,,,,,,,,,33811
40752,v2.loan.fixed.collection-33814,33814,v2.loan.fixed.collection,,0xCffC336E6D019C1aF58257A0b10bf2146a3f42A4,0x1eC627158650fF5dB5d6FCe7C1Ed6e0086D94F5f,52555000000000000000000,52986526945000000000000,30,9.990000,1682363507,2023-04-24T19:11:47.000Z,0x6B175474E89094C44Da98b954EedeAC495271d0F,17118141,0xc95639c3fe6ffd6062ab914ce7dcbf693ccbdd454573...,49319816314,522723,512935,6979618,49319816314,,,,,,,,,,,,,,,,,,,33814
40753,v2.loan.fixed.collection-33817,33817,v2.loan.fixed.collection,,0xCffC336E6D019C1aF58257A0b10bf2146a3f42A4,0x1eC627158650fF5dB5d6FCe7C1Ed6e0086D94F5f,52555000000000000000000,52986526945000000000000,30,9.990000,1682363555,2023-04-24T19:12:35.000Z,0x6B175474E89094C44Da98b954EedeAC495271d0F,17118145,0x837a2f77681fe4b192c1721eaf042ea7518a5315a916...,45264530207,505623,495835,15156691,45264530207,,,,,,,,,,,,,,,,,,,33817


In [7]:
display(mq['loan_id_cleaned'])
display(nftfi['loan_no_cleaned'])

0         4882
1          733
2        31180
3        27589
4        23358
         ...  
22037    20293
22038    20292
22039    20291
22040    20290
22041    20288
Name: loan_id_cleaned, Length: 22042, dtype: object

0            0
1            1
2            2
3            3
4            4
         ...  
40750    33827
40751    33811
40752    33814
40753    33817
40754    33826
Name: loan_no_cleaned, Length: 40755, dtype: object

In [8]:
mq.shape[0], nftfi.shape[0]

(22042, 40755)

In [9]:
# Check minimum and maximum dates of each table
print(f"min mq date: {mq.block_timestamp.min()}; max mq date: {mq.block_timestamp.max()}")
print(f"min nftfi date: {nftfi.date.min()}; max nftfi date: {nftfi.date.max()}")

min mq date: 2020-10-15 18:15:24.000000 UTC; max mq date: 2023-05-18 12:41:47.000000 UTC
min nftfi date: 2020-05-15T22:06:24.000Z; max nftfi date: 2023-04-24T20:20:47.000Z


In [10]:
mq.loc[mq.loan_id_cleaned.duplicated()==True].sort_values('loan_id_cleaned')

Unnamed: 0,transaction_hash,block_timestamp,loan_id,to_address,from_address,principal_amount,repayment_amount,erc20_address,erc20_name,due_date,duration_in_days,apr,token_id,collection_address,protocol,amt_in_usd,roll_over,block_number,p2p_p2pool,loan_id_cleaned
17754,0x853126067767f771040544ccf90f6a6e39c6328c442d...,2021-07-25 21:41:20.000000 UTC,-1001,0xae00360a54b97723c236093bd272b1b06efc14cd,0x82ba2d6184cb07c46687a89a62c4a9b5c584e87d,30.000,30.493151,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2021-08-24 21:41:20.000000 UTC,30.0,0.200000,18237,0x7bd29408f11d2bfc23c34f18275bbf23bb716bc7,nftfi,64742.160000,False,12897889,p2p,1001
11490,0x40739bfb7332c87bcb4b7037a8d15cb11c68c759a6cc...,2021-07-25 22:23:33.000000 UTC,-1002,0xade44991d931ca62e4b56f59a7a8e9160067f48a,0x6954d0255cfed71d55ad8b371b4170b8bf7709dc,0.200,0.204932,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2021-10-23 22:23:33.000000 UTC,90.0,0.100000,150280,0x50f5474724e0ee42d9a4e711ccfb275809fd6d4a,nftfi,432.446340,False,12898074,p2p,1002
19867,0x7b8f201bef86240d984f82ead58e61779e480c786941...,2022-04-22 22:45:07.000000 UTC,1009,0xd2db35024d1817defd4bb8617bdd7f05c07a870e,0x768f2a7ccdfde9ebdfd5cea8b635dd590cb3a3f1,24.000,24.710137,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-05-22 22:45:07.000000 UTC,30.0,0.360000,6049,0x8a90cab2b38dba80c64b7734e58ee1db38b8992e,nftfi,71154.048000,False,14637423,p2p,1009
8061,0xe4d7745df19b8e93e11fa5bb6fd0ab2472de80849628...,2022-04-22 23:29:20.000000 UTC,1010,0xb2a2a6a69e7a0ad66943f4c2869d45a9919cf740,0x613593559d211a55ee00797b1aed4abcca214209,0.385,0.396814,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-05-06 23:29:20.000000 UTC,14.0,0.800020,3030,0x42069abfe407c60cf4ae4112bedead391dba1cdb,nftfi,1139.224394,False,14637621,p2p,1010
8060,0x3c5db775c42168bca6b3df3ca028b43136931bfaaadd...,2022-04-22 23:41:27.000000 UTC,1011,0xb2a2a6a69e7a0ad66943f4c2869d45a9919cf740,0x613593559d211a55ee00797b1aed4abcca214209,0.385,0.396814,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-05-06 23:41:27.000000 UTC,14.0,0.800020,2391,0x42069abfe407c60cf4ae4112bedead391dba1cdb,nftfi,1139.224394,False,14637680,p2p,1011
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
19719,0xfbb30b44e9824770d84a15361b094e6a9a8aea33c338...,2022-04-21 22:54:16.000000 UTC,869,0xc35f3f92a9f27a157b309a9656cfea30e5c9cce3,0x3caf4d085a67e4beb3ec5364704881172b1830c8,9.000,9.887671,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-07-20 22:54:16.000000 UTC,90.0,0.400000,5554,0x8a90cab2b38dba80c64b7734e58ee1db38b8992e,nftfi,27028.056600,False,14631062,p2p,869
19718,0x911401ad5f892108602b797b5d94a04e7e236368350e...,2022-04-21 23:05:30.000000 UTC,870,0xc35f3f92a9f27a157b309a9656cfea30e5c9cce3,0x3caf4d085a67e4beb3ec5364704881172b1830c8,10.110,11.107151,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-07-20 23:05:30.000000 UTC,90.0,0.400000,5592,0x8a90cab2b38dba80c64b7734e58ee1db38b8992e,nftfi,30167.461530,False,14631114,p2p,870
19235,0x2883f40fd8879958105f438469292bbddd538609bda7...,2022-04-22 00:44:31.000000 UTC,889,0x648a58121dc0de4436837dc585ded4fa5fba6d3e,0x0aff497bd016000185b1c8302fa98a88ff4a4178,9.000,9.669378,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-05-22 00:44:31.000000 UTC,30.0,0.904900,2225,0x8a90cab2b38dba80c64b7734e58ee1db38b8992e,nftfi,26857.404000,False,14631573,p2p,889
20299,0x8460d4842534c4ae3c7aafbe610088636e4f2f8c9562...,2022-04-22 04:20:25.000000 UTC,949,0x8ad59324604e2170f45c12a5ba992e80648987ed,0xcb43971645190ca9181f26e4f40eade20d51f39f,9.500,10.413562,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-07-21 04:20:25.000000 UTC,90.0,0.390000,5294,0x8a90cab2b38dba80c64b7734e58ee1db38b8992e,nftfi,28458.008100,False,14632509,p2p,949


In [11]:
nftfi.head(2)

Unnamed: 0,loan_no,id,loan_contract,status,borrower,lender,loan_principal_amount,maximum_repayment_amount,loan_duration_d,loan_apr,loan_start_time,date,loan_erc20denomination,block_num,transaction_hash,gas_price,gas_limit,gas_used,cumulative_gas_used,effective_gas_price,repaid,liquidated,loan_repaid_time,repaid_amount_paid_to_lender,repaid_transaction_hash,repaid_gas_price,repaid_gas_limit,repaid_gas_used,repaid_cumulative_gas_used,repaid_effective_gas_price,repaid_admin_fee,loan_liquidation_date,liquidated_transaction_hash,liquidated_gas_price,liquidated_gas_limit,liquidated_gas_used,liquidated_cumulative_gas_used,liquidated_effective_gas_price,loan_no_cleaned
0,v1.loan.fixed-0,0,v1.loan.fixed,repaid,0xc35A5FEc6BE6957899E15559Be252Db882220b37,0x44DdF3e35Cd2D629d78674FF6BF5b953e2B069fe,30000000000000000,35000000000000000,7,869.047619,1589580384,2020-05-15T22:06:24.000Z,0xC02aaA39b223FE8D0A0e5C4F27eAD9083C756Cc2,10073259,0x7c7675a6613ddaded0b187314c2edd3ad3c5428a7a14...,17782723583,1000000,436882,3212704,17782723583,1.0,,2020-05-16T09:25:02.000Z,34750000000000000,0x3e24b9cd4c0208acc25259d4fcbddf75b48a554d6814...,19000000000.0,500000.0,120497.0,9549420.0,19000000000.0,250000000000000,,,,,,,,0
1,v1.loan.fixed-1,1,v1.loan.fixed,repaid,0xc35A5FEc6BE6957899E15559Be252Db882220b37,0x44DdF3e35Cd2D629d78674FF6BF5b953e2B069fe,3000000000000000,3100000000000000,7,173.809524,1589623507,2020-05-16T10:05:07.000Z,0xC02aaA39b223FE8D0A0e5C4F27eAD9083C756Cc2,10076484,0x937a5320404c0c835f2739c84b229ef837a9f0b0ef92...,19755020080,500000,441106,9710213,19755020080,1.0,,2020-05-16T11:50:26.000Z,3095000000000000,0x59d1c26160b7bdde716b380364b506e056d852ac1b36...,16974490000.0,500000.0,122603.0,9470068.0,16974490000.0,5000000000000,,,,,,,,1


In [12]:
print('MQ:\n')
print("Are loan_id unique? Once grouped by unique, the counts are: ")
mq_loan_id_count = pd.DataFrame(mq.groupby('loan_id').agg('count')['transaction_hash'])
mq_loan_id_count = mq_loan_id_count.reset_index()

display(mq_loan_id_count['transaction_hash'].unique())
display(mq_loan_id_count.loc[mq_loan_id_count['transaction_hash']>1])
duplicated_mq_loans = pd.merge(left=mq, right=mq_loan_id_count.loc[mq_loan_id_count['transaction_hash']>1], left_on='loan_id', right_on='loan_id')
display(duplicated_mq_loans)
display(duplicated_mq_loans.amt_in_usd.sum())
print("Are loan_id_cleaned unique? Once grouped by loan_id_cleaned, the counts are: ")
display(mq.groupby('loan_id_cleaned').agg('count')['transaction_hash'].unique())


MQ:

Are loan_id unique? Once grouped by unique, the counts are: 


array([1, 2])

Unnamed: 0,loan_id,transaction_hash
177,-6545,2
537,-5752,2
538,-5751,2
14879,21523,2
16152,24224,2
19041,30521,2
19042,30522,2
19043,30523,2


Unnamed: 0,transaction_hash_x,block_timestamp,loan_id,to_address,from_address,principal_amount,repayment_amount,erc20_address,erc20_name,due_date,duration_in_days,apr,token_id,collection_address,protocol,amt_in_usd,roll_over,block_number,p2p_p2pool,loan_id_cleaned,transaction_hash_y
0,0x7b88f5fb4c44e2ad1382c9f2174a077d15d628878e85...,2022-04-04 06:24:18.000000 UTC,-6545,0x648a58121dc0de4436837dc585ded4fa5fba6d3e,0x0aff497bd016000185b1c8302fa98a88ff4a4178,1.2,1.28925,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-05-04 06:24:18.000000 UTC,30.0,0.905,818,0x2acab3dea77832c09420663b0e1cb386031ba17b,nftfi,4208.42436,False,14517889,p2p,6545,2
1,0x7b88f5fb4c44e2ad1382c9f2174a077d15d628878e85...,2022-04-04 06:24:18.000000 UTC,-6545,0x648a58121dc0de4436837dc585ded4fa5fba6d3e,0x0aff497bd016000185b1c8302fa98a88ff4a4178,1.2,1.28925,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-05-04 06:24:18.000000 UTC,30.0,0.905,818,0x2acab3dea77832c09420663b0e1cb386031ba17b,nftfi,4208.42436,False,14517889,p2p,6545,2
2,0xbbd45783e2cd294f86ec604831eeeca7be8bd844818e...,2023-01-18 06:03:35.000000 UTC,21523,0x45d1a3acee4b57f5bb078a14d993364f80e86657,0xebd0db1bfaa50e7abe52412644e968166f349755,0.9,0.923819,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2023-02-01 06:03:35.000000 UTC,14.0,0.689995,1662,0x394e3d3044fc89fcdd966d3cb35ac0b32b0cda91,nftfi,1428.82479,False,16431774,p2p,21523,2
3,0xbbd45783e2cd294f86ec604831eeeca7be8bd844818e...,2023-01-18 06:03:35.000000 UTC,21523,0x45d1a3acee4b57f5bb078a14d993364f80e86657,0xebd0db1bfaa50e7abe52412644e968166f349755,0.9,0.923819,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2023-02-01 06:03:35.000000 UTC,14.0,0.689995,1662,0x394e3d3044fc89fcdd966d3cb35ac0b32b0cda91,nftfi,1428.82479,False,16431774,p2p,21523,2
4,0x205c9f50b22b5a4751b14e09efb1eacc757ede76ca42...,2023-03-26 16:43:47.000000 UTC,30522,0x48cf6acbcba1c8fe470827c6739a80c360ccc326,0x0b8428004ab7fea256dbc6e7c6412381cb173e8a,0.6,0.618181,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2023-04-09 16:43:47.000000 UTC,14.0,0.790008,365,0x64a1c0937728d8d2fa8cd81ef61a9c860b7362db,nftfi,1058.6076,False,16912865,p2p,30522,2
5,0x205c9f50b22b5a4751b14e09efb1eacc757ede76ca42...,2023-03-26 16:43:47.000000 UTC,30522,0x48cf6acbcba1c8fe470827c6739a80c360ccc326,0x0b8428004ab7fea256dbc6e7c6412381cb173e8a,0.6,0.618181,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2023-04-09 16:43:47.000000 UTC,14.0,0.790008,365,0x64a1c0937728d8d2fa8cd81ef61a9c860b7362db,nftfi,1058.6076,False,16912865,p2p,30522,2
6,0xd5f969b32332020a8e7129e4aa2f20a5bff446b31e00...,2023-03-26 16:43:11.000000 UTC,30521,0x48cf6acbcba1c8fe470827c6739a80c360ccc326,0x0b8428004ab7fea256dbc6e7c6412381cb173e8a,0.6,0.618181,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2023-04-09 16:43:11.000000 UTC,14.0,0.790008,323,0x64a1c0937728d8d2fa8cd81ef61a9c860b7362db,nftfi,1058.6076,False,16912862,p2p,30521,2
7,0xd5f969b32332020a8e7129e4aa2f20a5bff446b31e00...,2023-03-26 16:43:11.000000 UTC,30521,0x48cf6acbcba1c8fe470827c6739a80c360ccc326,0x0b8428004ab7fea256dbc6e7c6412381cb173e8a,0.6,0.618181,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2023-04-09 16:43:11.000000 UTC,14.0,0.790008,323,0x64a1c0937728d8d2fa8cd81ef61a9c860b7362db,nftfi,1058.6076,False,16912862,p2p,30521,2
8,0xb45fb78243aa6c0420fbb40e2c8cd1cf420eb914d003...,2022-03-20 17:57:17.000000 UTC,-5752,0x6744a9c6e3a9b8f7243ace5b20d51a500fcd0353,0xdef310bddbd0e2a524775505a134a86b6a583a6b,0.75,0.77589,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-04-03 17:57:17.000000 UTC,14.0,0.9,15130,0x86c10d10eca1fca9daf87a279abccabe0063f247,nftfi,2137.879425,False,14424722,p2p,5752,2
9,0xb45fb78243aa6c0420fbb40e2c8cd1cf420eb914d003...,2022-03-20 17:57:17.000000 UTC,-5752,0x6744a9c6e3a9b8f7243ace5b20d51a500fcd0353,0xdef310bddbd0e2a524775505a134a86b6a583a6b,0.75,0.77589,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-04-03 17:57:17.000000 UTC,14.0,0.9,15130,0x86c10d10eca1fca9daf87a279abccabe0063f247,nftfi,2137.879425,False,14424722,p2p,5752,2


28611.210136

Are loan_id_cleaned unique? Once grouped by loan_id_cleaned, the counts are: 


array([1, 2, 3])

In [13]:
print(f"duplicate lines in MQ dataset {mq.shape[0] - mq.drop_duplicates().shape[0]}")
print(f"duplicate lines in nftfi dataset {nftfi.shape[0] - nftfi.drop_duplicates().shape[0]}")

duplicate lines in MQ dataset 8
duplicate lines in nftfi dataset 0


## Clean raw NFTfi dataset

In [60]:
# nftfi.dtypes

In [15]:
nftfi['date'] = pd.to_datetime(nftfi['date'], format="%Y-%m-%d %H:%M:%S%z")
nftfi['loan_start_time'] = pd.to_datetime(nftfi['loan_start_time'], format="%Y-%m-%d %H:%M:%S%z")
nftfi['loan_repaid_time'] = pd.to_datetime(nftfi['loan_repaid_time'], format="%Y-%m-%d %H:%M:%S%z")

# Remove invalid values
nftfi.replace(r"#DIV/0!", np.nan, regex=True, inplace=True)
nftfi.replace(r"#N/A", "", regex=True, inplace=True)

# Divide loanPrincipalAmount and maximumRepaymentAmount by ETH <> WEI i.e. 1^18
columns_to_clean = ['loan_principal_amount', 'maximum_repayment_amount', 'maximum_repayment_amount']
for col in columns_to_clean:
    nftfi[col] = nftfi[col].astype(np.float64)
    nftfi[col] /= 10 ** 18
# nftfi['no_of_days'] = nftfi['no_of_days'].astype(np.float64)
nftfi = nftfi.rename(columns={'loan_apr': 'apr'})
nftfi['apr'] = nftfi['apr'].astype(np.float64)

# Drop last column as it is unnamed
nftfi = nftfi.drop('', axis=1, errors='ignore')

# set BOOL columns to bool type
cols = ['repaid', 'liquidated']
nftfi['repaid'] = nftfi['repaid'].fillna(False)
nftfi['repaid'] = nftfi['repaid'].replace('', False)
for col in cols:
    # nftfi[col] = nftfi[col].astype('boolean')
    nftfi[col] = nftfi[col].map({'True': True, 'False': False})
    nftfi[col] = nftfi[col].astype(bool)
nftfi['repaid'] = nftfi['repaid'].astype(bool)

## Enrich datasets

In [16]:
# Enrich dataset with ETHUSD rate i.e. ETHPrice, then fill USDValue for USDValue from loanERC20Denomination == weth_address
weth_address = '0xC02aaA39b223FE8D0A0e5C4F27eAD9083C756Cc2'.lower()
price_df = pd.read_csv('../analytics_bot_langchain/data/nftfi/eth_usd_input_data.csv')
price_df = price_df.rename(columns={'datetime': 'date'})
price_df['date'] = pd.to_datetime(price_df['date'], format='%Y-%m-%d %H:%M:%S%z')
price_df = price_df.drop(columns=['open', 'low', 'volume'])

nftfi['date'] = pd.to_datetime(nftfi['date'])
nftfi['loan_principal_amount'] = nftfi['loan_principal_amount'].astype(float)

nftfi = nftfi.sort_values(by='date')
price_df = price_df.sort_values(by='date')

nftfi = pd.merge_asof(nftfi, price_df, on='date', direction='backward')
nftfi['eth_price'] = nftfi['close']
nftfi = nftfi.drop(columns=['close'])
nftfi['loan_erc20denomination'] = nftfi['loan_erc20denomination'].astype(str).str.lower().str.strip()
nftfi.loc[nftfi['loan_erc20denomination'] == weth_address, 'usd_value'] = nftfi.loc[nftfi['loan_erc20denomination'] == weth_address]['loan_principal_amount'] * nftfi.loc[nftfi['loan_erc20denomination'] == weth_address]['eth_price']

# now map missing usd_value, e.g. for stablecoin-denominated loans
usdc_address = '0xA0b86991c6218b36c1d19D4a2e9Eb0cE3606eB48'  # https://etherscan.io/token/0xa0b86991c6218b36c1d19d4a2e9eb0ce3606eb48
usdt_address = '0xdAC17F958D2ee523a2206206994597C13D831ec7'  # https://etherscan.io/token/0xdac17f958d2ee523a2206206994597c13d831ec7
dai_address = '0x6B175474E89094C44Da98b954EedeAC495271d0F'  # https://etherscan.io/token/0x6b175474e89094c44da98b954eedeac495271d0f
stablecoin_addresses = [usdc_address, usdt_address, dai_address]
for stablecoin_address in stablecoin_addresses:
    stablecoin_address = stablecoin_address.lower()
    nftfi.loc[nftfi['loan_erc20denomination'] == stablecoin_address, 'usd_value'] = nftfi.loc[nftfi['loan_erc20denomination'] == stablecoin_address]['loan_principal_amount']



In [17]:
print('\n\nNFTfi: \n')
print("Are loan_no unique? Once grouped by unique, the counts are: ")
nftfi_loan_no_count = pd.DataFrame(nftfi.groupby('loan_no').agg('count')['borrower'])
duplicated_nftfi_loans = pd.merge(left=nftfi, right=nftfi_loan_no_count.loc[nftfi_loan_no_count['borrower']>1], left_on='loan_no', right_on='loan_no')
display(duplicated_nftfi_loans)
display(duplicated_nftfi_loans.usd_value.sum())

display(nftfi_loan_no_count['borrower'].unique())
display(nftfi_loan_no_count.loc[nftfi_loan_no_count['borrower']>1])

print("Are loan_no_cleaned unique? Once grouped by loan_id_cleaned, the counts are: ")
display(nftfi.groupby('loan_no_cleaned').agg('count')['borrower'].unique())



NFTfi: 

Are loan_no unique? Once grouped by unique, the counts are: 


Unnamed: 0,loan_no,id,loan_contract,status,borrower_x,lender,loan_principal_amount,maximum_repayment_amount,loan_duration_d,apr,loan_start_time,date,loan_erc20denomination,block_num,transaction_hash,gas_price,gas_limit,gas_used,cumulative_gas_used,effective_gas_price,repaid,liquidated,loan_repaid_time,repaid_amount_paid_to_lender,repaid_transaction_hash,repaid_gas_price,repaid_gas_limit,repaid_gas_used,repaid_cumulative_gas_used,repaid_effective_gas_price,repaid_admin_fee,loan_liquidation_date,liquidated_transaction_hash,liquidated_gas_price,liquidated_gas_limit,liquidated_gas_used,liquidated_cumulative_gas_used,liquidated_effective_gas_price,loan_no_cleaned,high,eth_price,usd_value,borrower_y


0.0

array([1])

Unnamed: 0_level_0,borrower
loan_no,Unnamed: 1_level_1


Are loan_no_cleaned unique? Once grouped by loan_id_cleaned, the counts are: 


array([1, 2])

## Enrich nftfi table with ERC20 denominations

In [18]:
# Check if it can be due to missing token
usdc_address = '0xA0b86991c6218b36c1d19D4a2e9Eb0cE3606eB48'  # https://etherscan.io/token/0xa0b86991c6218b36c1d19d4a2e9eb0ce3606eb48
usdt_address = '0xdAC17F958D2ee523a2206206994597C13D831ec7'  # https://etherscan.io/token/0xdac17f958d2ee523a2206206994597c13d831ec7
dai_address = '0x6B175474E89094C44Da98b954EedeAC495271d0F'  # https://etherscan.io/token/0x6b175474e89094c44da98b954eedeac495271d0f
weth_address = '0xC02aaA39b223FE8D0A0e5C4F27eAD9083C756Cc2'

stablecoin_addresses = [usdc_address, usdt_address, dai_address, weth_address]

stablecoin_names = ['usdc', 'usdt', 'dai', 'weth']
for stablecoin_address, stablecoin_name in zip(stablecoin_addresses, stablecoin_names):
    stablecoin_address = stablecoin_address.lower()
    nftfi.loc[nftfi['loan_erc20denomination'] == stablecoin_address, 'loan_erc20denomination_name'] = stablecoin_name

In [19]:
# Confirm that the above addresses matches the one available in MQ dataset:
mq.erc20_address.unique()

array(['0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2',
       '0x6b175474e89094c44da98b954eedeac495271d0f',
       '0xa0b86991c6218b36c1d19d4a2e9eb0ce3606eb48'], dtype=object)

#### Enrich NFTfi table with loan types

In [20]:
nftfi['loan_type'] = nftfi.loan_no.astype(str).str.split('-').apply(lambda x: x[0]+'-'+x[1] if len(x) >2 else x[0])
nftfi['loan_type'].unique()

array(['v1.loan.fixed', 'v2.loan.fixed', 'v2-1.loan.fixed',
       'v2.loan.fixed.collection'], dtype=object)

## Compute April subset for each table

In [21]:
april_mq = mq.loc[mq['block_timestamp'] >= '2023-04-01'].loc[mq['block_timestamp'] < '2023-05-01']
april_mq.shape

(1852, 20)

In [22]:
april_nftfi = nftfi.loc[nftfi['date'] >= '2023-04-01'].loc[nftfi['date'] < '2023-05-01']
april_nftfi.shape

(2784, 44)

#### Check for duplicates

In [23]:
april_nftfi.loc[april_nftfi.loan_no_cleaned.duplicated()== True]

Unnamed: 0,loan_no,id,loan_contract,status,borrower,lender,loan_principal_amount,maximum_repayment_amount,loan_duration_d,apr,loan_start_time,date,loan_erc20denomination,block_num,transaction_hash,gas_price,gas_limit,gas_used,cumulative_gas_used,effective_gas_price,repaid,liquidated,loan_repaid_time,repaid_amount_paid_to_lender,repaid_transaction_hash,repaid_gas_price,repaid_gas_limit,repaid_gas_used,repaid_cumulative_gas_used,repaid_effective_gas_price,repaid_admin_fee,loan_liquidation_date,liquidated_transaction_hash,liquidated_gas_price,liquidated_gas_limit,liquidated_gas_used,liquidated_cumulative_gas_used,liquidated_effective_gas_price,loan_no_cleaned,high,eth_price,usd_value,loan_erc20denomination_name,loan_type


In [24]:
april_mq.loc[april_mq.loan_id_cleaned.duplicated()== True]

Unnamed: 0,transaction_hash,block_timestamp,loan_id,to_address,from_address,principal_amount,repayment_amount,erc20_address,erc20_name,due_date,duration_in_days,apr,token_id,collection_address,protocol,amt_in_usd,roll_over,block_number,p2p_p2pool,loan_id_cleaned


In [25]:
april_nftfi.loc[april_nftfi.loan_no_cleaned.duplicated()== True]

Unnamed: 0,loan_no,id,loan_contract,status,borrower,lender,loan_principal_amount,maximum_repayment_amount,loan_duration_d,apr,loan_start_time,date,loan_erc20denomination,block_num,transaction_hash,gas_price,gas_limit,gas_used,cumulative_gas_used,effective_gas_price,repaid,liquidated,loan_repaid_time,repaid_amount_paid_to_lender,repaid_transaction_hash,repaid_gas_price,repaid_gas_limit,repaid_gas_used,repaid_cumulative_gas_used,repaid_effective_gas_price,repaid_admin_fee,loan_liquidation_date,liquidated_transaction_hash,liquidated_gas_price,liquidated_gas_limit,liquidated_gas_used,liquidated_cumulative_gas_used,liquidated_effective_gas_price,loan_no_cleaned,high,eth_price,usd_value,loan_erc20denomination_name,loan_type


In [26]:
display(april_mq.head(3).sort_values('loan_id_cleaned', ascending=False))
display(april_nftfi.head(3).sort_values('loan_no_cleaned', ascending=False))

Unnamed: 0,transaction_hash,block_timestamp,loan_id,to_address,from_address,principal_amount,repayment_amount,erc20_address,erc20_name,due_date,duration_in_days,apr,token_id,collection_address,protocol,amt_in_usd,roll_over,block_number,p2p_p2pool,loan_id_cleaned
28,0xecaf8a9e276b227506ebc8acc837792370ec83d52e39...,2023-04-28 00:40:35.000000 UTC,34311,0xefa755b82218dc287ed37bf6463c144ae6609076,0x08f6db921b10ce9f7ec4166b9be9dc01a30c34cc,10000.0,10082.191781,0xa0b86991c6218b36c1d19d4a2e9eb0ce3606eb48,USDc,2023-05-28 00:40:35.000000 UTC,30.0,0.1,6096,0x059edd72cd353df5106d2b9cc5ab83a52287ac3a,nftfi,10000.0,False,17141128,p2p,34311
82,0x2d07d7afcb6324bfc6239c6bcc9bca658a49cd2b227c...,2023-04-27 13:53:47.000000 UTC,34265,0xa35b95b60af5205dbd02571d8d72ef83f79a28af,0x1797b4235473fbe0e7e44322f01c1b5618ebda41,6.0,6.54,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2024-04-26 13:53:47.000000 UTC,365.0,0.09,9470,0x059edd72cd353df5106d2b9cc5ab83a52287ac3a,nftfi,11261.0808,False,17137936,p2p,34265
2,0x0f3522aa06eb28b8cceb590ea80cbd335ab64010dab8...,2023-04-02 09:27:59.000000 UTC,31180,0xf7b18e107eb36797f4ce36de756630b9c30969ad,0x31d75becb2fe9cc60eb4877b44110aa1cdae90a5,800.0,826.30137,0x6b175474e89094c44da98b954eedeac495271d0f,DAI,2023-06-01 09:27:59.000000 UTC,60.0,0.2,2118,0x026224a2940bfe258d0dbe947919b62fe321f042,nftfi,800.0,False,16960517,p2p,31180


Unnamed: 0,loan_no,id,loan_contract,status,borrower,lender,loan_principal_amount,maximum_repayment_amount,loan_duration_d,apr,loan_start_time,date,loan_erc20denomination,block_num,transaction_hash,gas_price,gas_limit,gas_used,cumulative_gas_used,effective_gas_price,repaid,liquidated,loan_repaid_time,repaid_amount_paid_to_lender,repaid_transaction_hash,repaid_gas_price,repaid_gas_limit,repaid_gas_used,repaid_cumulative_gas_used,repaid_effective_gas_price,repaid_admin_fee,loan_liquidation_date,liquidated_transaction_hash,liquidated_gas_price,liquidated_gas_limit,liquidated_gas_used,liquidated_cumulative_gas_used,liquidated_effective_gas_price,loan_no_cleaned,high,eth_price,usd_value,loan_erc20denomination_name,loan_type
37973,v2.loan.fixed.collection-31046,31046,v2.loan.fixed.collection,,0x58463E8ecA64FE736a26d7A2eD95B4Bc6127e268,0x3e60C12997d3Bb062530e5F7e7f0400FBB9aEcA5,0.686,7.019577999999999e-19,30,28.302216,1970-01-01 00:00:01.680310871,2023-04-01 01:01:11+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,16950907,0x57bfc3c592f00d6fad19dabbc746cba5ada6d55263bd...,19323776633,476002,466214,17071471,19323776633,True,True,NaT,,,,,,,,,,,,,,,,31046,1821.82,1821.51,1249.55586,weth,v2.loan.fixed.collection
37972,v2-1.loan.fixed-31045,31045,v2-1.loan.fixed,,0x07a2CF3c078D9526Eb50Ba7AFFaBc0049827D126,0x064980edD7D43AbEE781f49A4e31C06Df05EcccB,0.375,4.0273999999999996e-19,30,90.000889,1970-01-01 00:00:01.680308543,2023-04-01 00:22:23+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,16950714,0xa9ba08c02d21f2431178b2daa9edb4e50416948373e8...,21761128223,466942,461954,9657250,21761128223,True,True,NaT,,,,,,,,,,,,,,,,31045,1827.85,1825.6,684.6,weth,v2-1.loan.fixed
37971,v2-1.loan.fixed-31044,31044,v2-1.loan.fixed,repaid,0x371267a1863080c5F39229183350e0D87d39743E,0x9CD074f0192BB2A477DA3271bA03db4fc5cD38c7,2.6,2.685458e-18,30,39.989962,1970-01-01 00:00:01.680307511,2023-04-01 00:05:11+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,16950628,0x18c7c39e8fdb35cd976872d05263f92e34d9e8b5825c...,26393453389,539029,524441,5046898,26393453389,True,True,2023-04-24 09:17:59+00:00,2.6811851e+18,0xb0ca08e743122d22d09806ba5850cda85f605dee5bfc...,38753230000.0,454254.0,240516.0,2481228.0,38753230000.0,4272900000000000.0,,,,,,,,31044,1824.45,1823.42,4740.892,weth,v2-1.loan.fixed


In [27]:
# Determine the set of unique IDs present in MQ and not in NFTfi
len(set(list(april_mq.loan_id_cleaned)) - set(list(april_nftfi.loan_no_cleaned)))

430

In [28]:
# Determine the set of unique IDs present in NFTfi and not in MQ's
len(set(list(april_nftfi.loan_no_cleaned)) - set(list(april_mq.loan_id_cleaned)))

1362

In [29]:
april_mq.shape, april_nftfi.shape

((1852, 20), (2784, 44))

In [30]:
april_nftfi.shape[0] - april_mq.shape[0]

932

## Compute which Loans are available in NFTfi's and not in MQ's, and the converse, by matching on transaction hashes

In [33]:
# how do i get all rows in df1 that are not in df2
# and all rows in df2 that are not in df1?

# Perform a full outer join on df1 and df2
full_outer = pd.merge(april_nftfi, april_mq, how='outer', on='transaction_hash', indicator=True)

# Filter out the rows that are unique to df1
unique_to_april_nftfi = full_outer[full_outer['_merge'] == 'left_only']

# Filter out the rows that are unique to df2
unique_to_april_mq = full_outer[full_outer['_merge'] == 'right_only']


In [34]:
print(f"number of loans unique to NFTfi relative to MQ in April 2023: {unique_to_april_nftfi.shape[0]}, i.e. {100 * round(unique_to_april_nftfi.shape[0] / april_nftfi.shape[0], 2)}%")
print(f"while in April 2023 NFTfi had {april_nftfi.shape[0]} loans while mq had {april_mq.shape[0]}, i.e. for April NFTfi has {april_nftfi.shape[0] - april_mq.shape[0]} more loans")
display(unique_to_april_nftfi.shape[0])
display(unique_to_april_nftfi.head(2))

number of loans unique to NFTfi relative to MQ in April 2023: 1362, i.e. 49.0%
while in April 2023 NFTfi had 2784 loans while mq had 1852, i.e. for April NFTfi has 932 more loans


1362

Unnamed: 0,loan_no,id,loan_contract,status,borrower,lender,loan_principal_amount,maximum_repayment_amount,loan_duration_d,apr_x,loan_start_time,date,loan_erc20denomination,block_num,transaction_hash,gas_price,gas_limit,gas_used,cumulative_gas_used,effective_gas_price,repaid,liquidated,loan_repaid_time,repaid_amount_paid_to_lender,repaid_transaction_hash,repaid_gas_price,repaid_gas_limit,repaid_gas_used,repaid_cumulative_gas_used,repaid_effective_gas_price,repaid_admin_fee,loan_liquidation_date,liquidated_transaction_hash,liquidated_gas_price,liquidated_gas_limit,liquidated_gas_used,liquidated_cumulative_gas_used,liquidated_effective_gas_price,loan_no_cleaned,high,eth_price,usd_value,loan_erc20denomination_name,loan_type,block_timestamp,loan_id,to_address,from_address,principal_amount,repayment_amount,erc20_address,erc20_name,due_date,duration_in_days,apr_y,token_id,collection_address,protocol,amt_in_usd,roll_over,block_number,p2p_p2pool,loan_id_cleaned,_merge
1,v2-1.loan.fixed-31045,31045.0,v2-1.loan.fixed,,0x07a2CF3c078D9526Eb50Ba7AFFaBc0049827D126,0x064980edD7D43AbEE781f49A4e31C06Df05EcccB,0.375,4.0273999999999996e-19,30.0,90.000889,1970-01-01 00:00:01.680308543,2023-04-01 00:22:23+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,16950714.0,0xa9ba08c02d21f2431178b2daa9edb4e50416948373e8...,21761130000.0,466942.0,461954.0,9657250.0,21761130000.0,True,True,NaT,,,,,,,,,,,,,,,,31045,1827.85,1825.6,684.6,weth,v2-1.loan.fixed,,,,,,,,,,,,,,,,,,,,left_only
2,v2.loan.fixed.collection-31046,31046.0,v2.loan.fixed.collection,,0x58463E8ecA64FE736a26d7A2eD95B4Bc6127e268,0x3e60C12997d3Bb062530e5F7e7f0400FBB9aEcA5,0.686,7.019577999999999e-19,30.0,28.302216,1970-01-01 00:00:01.680310871,2023-04-01 01:01:11+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,16950907.0,0x57bfc3c592f00d6fad19dabbc746cba5ada6d55263bd...,19323780000.0,476002.0,466214.0,17071471.0,19323780000.0,True,True,NaT,,,,,,,,,,,,,,,,31046,1821.82,1821.51,1249.55586,weth,v2.loan.fixed.collection,,,,,,,,,,,,,,,,,,,,left_only


In [35]:
print(f"number of loans unique to MQ relative to NFTfi in April 2023: {unique_to_april_mq.shape[0]}, i.e. {100 * round(unique_to_april_mq.shape[0] / april_mq.shape[0], 2)}%")
print(f"while in April 2023 NFTfi had {april_nftfi.shape[0]} loans while mq had {april_mq.shape[0]}, i.e. for April NFTfi has {april_nftfi.shape[0] - april_mq.shape[0]} more loans")

display(unique_to_april_mq.shape[0])
display(unique_to_april_mq.head(2))

number of loans unique to MQ relative to NFTfi in April 2023: 430, i.e. 23.0%
while in April 2023 NFTfi had 2784 loans while mq had 1852, i.e. for April NFTfi has 932 more loans


430

Unnamed: 0,loan_no,id,loan_contract,status,borrower,lender,loan_principal_amount,maximum_repayment_amount,loan_duration_d,apr_x,loan_start_time,date,loan_erc20denomination,block_num,transaction_hash,gas_price,gas_limit,gas_used,cumulative_gas_used,effective_gas_price,repaid,liquidated,loan_repaid_time,repaid_amount_paid_to_lender,repaid_transaction_hash,repaid_gas_price,repaid_gas_limit,repaid_gas_used,repaid_cumulative_gas_used,repaid_effective_gas_price,repaid_admin_fee,loan_liquidation_date,liquidated_transaction_hash,liquidated_gas_price,liquidated_gas_limit,liquidated_gas_used,liquidated_cumulative_gas_used,liquidated_effective_gas_price,loan_no_cleaned,high,eth_price,usd_value,loan_erc20denomination_name,loan_type,block_timestamp,loan_id,to_address,from_address,principal_amount,repayment_amount,erc20_address,erc20_name,due_date,duration_in_days,apr_y,token_id,collection_address,protocol,amt_in_usd,roll_over,block_number,p2p_p2pool,loan_id_cleaned,_merge
2784,,,,,,,,,,,NaT,NaT,,,0xecaf8a9e276b227506ebc8acc837792370ec83d52e39...,,,,,,,,NaT,,,,,,,,,,,,,,,,,,,,,,2023-04-28 00:40:35.000000 UTC,34311.0,0xefa755b82218dc287ed37bf6463c144ae6609076,0x08f6db921b10ce9f7ec4166b9be9dc01a30c34cc,10000.0,10082.191781,0xa0b86991c6218b36c1d19d4a2e9eb0ce3606eb48,USDc,2023-05-28 00:40:35.000000 UTC,30.0,0.1,6096,0x059edd72cd353df5106d2b9cc5ab83a52287ac3a,nftfi,10000.0,False,17141128.0,p2p,34311,right_only
2785,,,,,,,,,,,NaT,NaT,,,0x2d07d7afcb6324bfc6239c6bcc9bca658a49cd2b227c...,,,,,,,,NaT,,,,,,,,,,,,,,,,,,,,,,2023-04-27 13:53:47.000000 UTC,34265.0,0xa35b95b60af5205dbd02571d8d72ef83f79a28af,0x1797b4235473fbe0e7e44322f01c1b5618ebda41,6.0,6.54,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2024-04-26 13:53:47.000000 UTC,365.0,0.09,9470,0x059edd72cd353df5106d2b9cc5ab83a52287ac3a,nftfi,11261.0808,False,17137936.0,p2p,34265,right_only


In [36]:
pd.set_option('display.float_format', '{:,.0f}'.format)
pd.DataFrame(unique_to_april_nftfi.groupby('loan_contract').agg(sum)['usd_value'])

  pd.DataFrame(unique_to_april_nftfi.groupby('loan_contract').agg(sum)['usd_value'])


Unnamed: 0_level_0,usd_value
loan_contract,Unnamed: 1_level_1
v2-1.loan.fixed,5254060
v2.loan.fixed.collection,8974156


In [37]:
mq_loans_not_in_nftfi = list(
        set(list(april_mq.loan_id_cleaned)) - set(list(april_nftfi.loan_no_cleaned))
    )
mq_loans_not_in_nftfi[:5]

['34149', '34246', '33866', '34353', '34240']

In [38]:
len(mq_loans_not_in_nftfi)

430

In [39]:
# MQ loans not in NFTfi
# mq_not_in_nftfi = april_mq[april_mq['loan_id_cleaned'].isin(mq_loans_not_in_nftfi)].reset_index(drop=True)
mq_not_in_nftfi.head(3)

Unnamed: 0,transaction_hash,block_timestamp,loan_id,to_address,from_address,principal_amount,repayment_amount,erc20_address,erc20_name,due_date,duration_in_days,apr_x,token_id,collection_address,protocol,amt_in_usd,roll_over,block_number,p2p_p2pool,loan_id_cleaned,loan_no,id,loan_contract,status,borrower,lender,loan_principal_amount,maximum_repayment_amount,loan_duration_d,apr_y,loan_start_time,date,loan_erc20denomination,block_num,gas_price,gas_limit,gas_used,cumulative_gas_used,effective_gas_price,repaid,liquidated,loan_repaid_time,repaid_amount_paid_to_lender,repaid_transaction_hash,repaid_gas_price,repaid_gas_limit,repaid_gas_used,repaid_cumulative_gas_used,repaid_effective_gas_price,repaid_admin_fee,loan_liquidation_date,liquidated_transaction_hash,liquidated_gas_price,liquidated_gas_limit,liquidated_gas_used,liquidated_cumulative_gas_used,liquidated_effective_gas_price,loan_no_cleaned,high,eth_price,usd_value,loan_erc20denomination_name,loan_type
0,0x0f3522aa06eb28b8cceb590ea80cbd335ab64010dab8...,2023-04-02 09:27:59.000000 UTC,31180,0xf7b18e107eb36797f4ce36de756630b9c30969ad,0x31d75becb2fe9cc60eb4877b44110aa1cdae90a5,800,826,0x6b175474e89094c44da98b954eedeac495271d0f,DAI,2023-06-01 09:27:59.000000 UTC,60,0,2118,0x026224a2940bfe258d0dbe947919b62fe321f042,nftfi,800,False,16960517,p2p,31180,v2-1.loan.fixed-31180,31180.0,v2-1.loan.fixed,,0xF7B18e107eb36797f4cE36dE756630B9C30969ad,0x31d75BeCb2fE9cC60Eb4877B44110aA1CdaE90A5,800.0,0.0,30.0,20.0,1970-01-01 00:00:01.680427679,2023-04-02 09:27:59+00:00,0x6b175474e89094c44da98b954eedeac495271d0f,16960517.0,20274855936.0,551203.0,531815.0,4667879.0,20274855936.0,True,True,NaT,,,,,,,,,,,,,,,,31180.0,1821.0,1821.0,800.0,dai,v2-1.loan.fixed
1,0xecaf8a9e276b227506ebc8acc837792370ec83d52e39...,2023-04-28 00:40:35.000000 UTC,34311,0xefa755b82218dc287ed37bf6463c144ae6609076,0x08f6db921b10ce9f7ec4166b9be9dc01a30c34cc,10000,10082,0xa0b86991c6218b36c1d19d4a2e9eb0ce3606eb48,USDc,2023-05-28 00:40:35.000000 UTC,30,0,6096,0x059edd72cd353df5106d2b9cc5ab83a52287ac3a,nftfi,10000,False,17141128,p2p,34311,,,,,,,,,,,NaT,NaT,,,,,,,,,,NaT,,,,,,,,,,,,,,,,,,,,,
2,0x2d07d7afcb6324bfc6239c6bcc9bca658a49cd2b227c...,2023-04-27 13:53:47.000000 UTC,34265,0xa35b95b60af5205dbd02571d8d72ef83f79a28af,0x1797b4235473fbe0e7e44322f01c1b5618ebda41,6,7,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2024-04-26 13:53:47.000000 UTC,365,0,9470,0x059edd72cd353df5106d2b9cc5ab83a52287ac3a,nftfi,11261,False,17137936,p2p,34265,,,,,,,,,,,NaT,NaT,,,,,,,,,,NaT,,,,,,,,,,,,,,,,,,,,,


In [40]:
# We need to explore this table
mq_not_in_nftfi.erc20_name.unique()

array(['DAI', 'USDc', 'wETH'], dtype=object)

## NFTfi loans not in MQ

In [41]:
nftfi_loans_not_in_mq = list(
        set(list(april_nftfi.loan_no_cleaned)) - set(list(april_mq.loan_id_cleaned))
    )
len(nftfi_loans_not_in_mq)

1362

In [42]:
## LOANS IN NFTFI AND NOT IN MQ
# nftfi_not_in_mq = april_nftfi[april_nftfi['loan_no_cleaned'].isin(nftfi_loans_not_in_mq)].reset_index(drop=True)
nftfi_not_in_mq

Unnamed: 0,loan_no,id,loan_contract,status,borrower,lender,loan_principal_amount,maximum_repayment_amount,loan_duration_d,apr_x,loan_start_time,date,loan_erc20denomination,block_num,transaction_hash,gas_price,gas_limit,gas_used,cumulative_gas_used,effective_gas_price,repaid,liquidated,loan_repaid_time,repaid_amount_paid_to_lender,repaid_transaction_hash,repaid_gas_price,repaid_gas_limit,repaid_gas_used,repaid_cumulative_gas_used,repaid_effective_gas_price,repaid_admin_fee,loan_liquidation_date,liquidated_transaction_hash,liquidated_gas_price,liquidated_gas_limit,liquidated_gas_used,liquidated_cumulative_gas_used,liquidated_effective_gas_price,loan_no_cleaned,high,eth_price,usd_value,loan_erc20denomination_name,loan_type,block_timestamp,loan_id,to_address,from_address,principal_amount,repayment_amount,erc20_address,erc20_name,due_date,duration_in_days,apr_y,token_id,collection_address,protocol,amt_in_usd,roll_over,block_number,p2p_p2pool,loan_id_cleaned
0,v2-1.loan.fixed-31044,31044,v2-1.loan.fixed,repaid,0x371267a1863080c5F39229183350e0D87d39743E,0x9CD074f0192BB2A477DA3271bA03db4fc5cD38c7,3,0,30,40,1970-01-01 00:00:01.680307511,2023-04-01 00:05:11+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,16950628,0x18c7c39e8fdb35cd976872d05263f92e34d9e8b5825c...,26393453389,539029,524441,5046898,26393453389,True,True,2023-04-24 09:17:59+00:00,2681185100000000000,0xb0ca08e743122d22d09806ba5850cda85f605dee5bfc...,38753230709,454254,240516,2481228,38753230709,4272900000000000,,,,,,,,31044,1824,1823,4741,weth,v2-1.loan.fixed,2023-04-01 00:05:11.000000 UTC,31044,0x371267a1863080c5f39229183350e0d87d39743e,0x9cd074f0192bb2a477da3271ba03db4fc5cd38c7,3,3,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2023-05-01 00:05:11.000000 UTC,30,0,17119,0x49cf6f5d44e70224e2e23fdcdd2c053f30ada28b,nftfi,4737,False,16950628,p2p,31044
1,v2-1.loan.fixed-31045,31045,v2-1.loan.fixed,,0x07a2CF3c078D9526Eb50Ba7AFFaBc0049827D126,0x064980edD7D43AbEE781f49A4e31C06Df05EcccB,0,0,30,90,1970-01-01 00:00:01.680308543,2023-04-01 00:22:23+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,16950714,0xa9ba08c02d21f2431178b2daa9edb4e50416948373e8...,21761128223,466942,461954,9657250,21761128223,True,True,NaT,,,,,,,,,,,,,,,,31045,1828,1826,685,weth,v2-1.loan.fixed,,,,,,,,,,,,,,,,,,,
2,v2.loan.fixed.collection-31046,31046,v2.loan.fixed.collection,,0x58463E8ecA64FE736a26d7A2eD95B4Bc6127e268,0x3e60C12997d3Bb062530e5F7e7f0400FBB9aEcA5,1,0,30,28,1970-01-01 00:00:01.680310871,2023-04-01 01:01:11+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,16950907,0x57bfc3c592f00d6fad19dabbc746cba5ada6d55263bd...,19323776633,476002,466214,17071471,19323776633,True,True,NaT,,,,,,,,,,,,,,,,31046,1822,1822,1250,weth,v2.loan.fixed.collection,,,,,,,,,,,,,,,,,,,
3,v2-1.loan.fixed-31047,31047,v2-1.loan.fixed,repaid,0xCd8826a0298cfCd4eeB3a0c118a8aa664316Cd7A,0xBbB589796d01EF05f24C49f57d53125d4382ab62,1,0,7,55,1970-01-01 00:00:01.680310979,2023-04-01 01:02:59+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,16950915,0x6dc7560b2f2d22ad29d1009f2e2c27ff50522d7f0a2a...,19546172958,498655,493667,7247311,19546172958,True,True,2023-04-14 22:58:23+00:00,1224049250000000000,0x11869c955df36d7cbca9e01418f775bcf9ff363741de...,27869791665,406804,215209,992838,27869791665,1265750000000000,,,,,,,,31047,1822,1822,2186,weth,v2-1.loan.fixed,2023-04-01 01:02:59.000000 UTC,31047,0xcd8826a0298cfcd4eeb3a0c118a8aa664316cd7a,0xbbb589796d01ef05f24c49f57d53125d4382ab62,1,1,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2023-04-15 01:02:59.000000 UTC,14,1,9517,0x5946aeaab44e65eb370ffaa6a7ef2218cff9b47d,nftfi,2188,False,16950915,p2p,31047
4,v2.loan.fixed.collection-31048,31048,v2.loan.fixed.collection,,0x3b7393118f0d8f99f269854CF441A5ebCb0Af246,0x591EC71097d9Fda67cF53732239F9591688f37E9,1,0,30,60,1970-01-01 00:00:01.680316595,2023-04-01 02:36:35+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,16951376,0x214898bcb85badfe65864f93faeb933afa8792b23fff...,23602727755,503689,489101,10647808,23602727755,True,True,NaT,,,,,,,,,,,,,,,,31048,1828,1825,1642,weth,v2.loan.fixed.collection,,,,,,,,,,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2779,v2-1.loan.fixed-33820,33820,v2-1.loan.fixed,,0xBeC69dfcE4c1fA8b7843FEE1Ca85788d84A86B06,0xc3cea12ffda8B3Dff435155461de6FCc72315117,0,0,30,69,1970-01-01 00:00:01.682364203,2023-04-24 19:23:23+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,17118198,0xd72a47b553f0125bc8ef9ff93fca570d0031a53fe44a...,49000000000,470680,465692,6148167,49000000000,True,True,NaT,,,,,,,,,,,,,,,,33820,1831,1829,915,weth,v2-1.loan.fixed,,,,,,,,,,,,,,,,,,,
2780,v2-1.loan.fixed-33824,33824,v2-1.loan.fixed,,0x353D1aF0fA732F6230Ff4ab0eB2a6A3Dcf4C54F2,0x1797b4235473fbE0e7e44322F01C1B5618EBda41,7,0,365,9,1970-01-01 00:00:01.682364971,2023-04-24 19:36:11+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,17118262,0x862834c19fc5e3255d85ee631d45b38c210055fb8aa8...,55983293990,528871,509483,9778066,55983293990,True,True,NaT,,,,,,,,,,,,,,,,33824,1833,1832,12824,weth,v2-1.loan.fixed,2023-04-24 19:36:11.000000 UTC,33824,0x353d1af0fa732f6230ff4ab0eb2a6a3dcf4c54f2,0x1797b4235473fbe0e7e44322f01c1b5618ebda41,7,8,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2024-04-23 19:36:11.000000 UTC,365,0,3903,0x059edd72cd353df5106d2b9cc5ab83a52287ac3a,nftfi,12821,False,17118262,p2p,33824
2781,v2-1.loan.fixed-33825,33825,v2-1.loan.fixed,,0xD758bf1da4B9683454b97988175aa6F9419c2B39,0x1797b4235473fbE0e7e44322F01C1B5618EBda41,7,0,365,9,1970-01-01 00:00:01.682366579,2023-04-24 20:02:59+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,17118392,0x0f94288dd02f42bb2a38bbacffb8c8d7afa8c7519f8d...,48923952650,528891,509503,16206666,48923952650,True,True,NaT,,,,,,,,,,,,,,,,33825,1836,1836,12851,weth,v2-1.loan.fixed,2023-04-24 20:02:59.000000 UTC,33825,0xd758bf1da4b9683454b97988175aa6f9419c2b39,0x1797b4235473fbe0e7e44322f01c1b5618ebda41,7,8,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2024-04-23 20:02:59.000000 UTC,365,0,795,0x059edd72cd353df5106d2b9cc5ab83a52287ac3a,nftfi,12819,False,17118392,p2p,33825
2782,v2.loan.fixed.collection-33826,33826,v2.loan.fixed.collection,,0x739dEB8B1232BF13687c0607dd3035E983b3f56F,0xe9bAB3816a139827fE218D58699097B359680380,2,0,14,79,1970-01-01 00:00:01.682367131,2023-04-24 20:12:11+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,17118438,0x49a1183d64fa141041920c35ee637713bc411390f112...,56169185321,512105,502317,12210820,56169185321,True,True,NaT,,,,,,,,,,,,,,,,33826,1839,1838,4137,weth,v2.loan.fixed.collection,,,,,,,,,,,,,,,,,,,


In [43]:
# Explore the resulting set of nftfi_not_in_mq. Is there any pattern?
nftfi_not_in_mq.describe()

Unnamed: 0,id,loan_principal_amount,maximum_repayment_amount,loan_duration_d,apr_x,block_num,gas_price,gas_limit,gas_used,cumulative_gas_used,effective_gas_price,repaid_gas_price,repaid_gas_limit,repaid_gas_used,repaid_cumulative_gas_used,repaid_effective_gas_price,liquidated_gas_price,liquidated_gas_limit,liquidated_gas_used,liquidated_cumulative_gas_used,liquidated_effective_gas_price,high,eth_price,usd_value,loan_id,principal_amount,repayment_amount,duration_in_days,apr_y,amt_in_usd,block_number
count,2784,2784,2784,2784,2784,2784,2784,2784,2784,2784,2784,494,494,494,494,494,265,265,265,265,265,2784,2784,2784,1422,1422,1422,1422,1422,1422,1422
mean,32436,1206,0,29,52,17032597,30576111122,501913,486009,11214634,30576111122,34669794963,409011,216708,6353557,34669794963,45402104291,517582,179911,6360596,45402104291,1927,1926,6856,32433,289,298,33,0,3471,17032664
std,804,7437,0,39,35,46747,12923017372,68596,29331,5761207,12923017372,15000096631,49175,21792,6073457,15000096631,12516144261,951731,31950,4368854,12516144261,101,101,18951,827,1736,1793,52,0,5434,48343
min,31044,0,0,1,0,16950628,15840527982,449404,439616,474677,15840527982,18825273282,266788,185436,348367,18825273282,19116326214,202882,160556,566241,19116326214,1776,1775,0,31044,0,0,3,0,18,16950628
25%,31740,0,0,14,29,16992504,21577190703,470481,463202,7437193,21577190703,24210609004,375816,199394,2204403,24210609004,37307097371,304323,160556,3691044,37307097371,1857,1856,778,31745,0,0,14,0,765,16992636
50%,32436,1,0,30,49,17029126,26114680192,494964,485078,10221288,26114680192,29000000000,392698,208591,3898013,29000000000,45560881573,304323,160556,5131213,45560881573,1892,1891,1419,32364,1,1,30,0,1657,17025498
75%,33131,3,0,30,70,17069743,35817050548,522432,507749,13740146,35817050548,39809426483,439932,232878,8496101,39809426483,54946767423,370306,195747,7715615,54946767423,1985,1983,4009,33188,2,2,30,1,2999,17074250
max,33827,65000,0,371,299,17118481,111844547450,2127032,624659,29910369,111844547450,98131606435,957728,335420,29181971,98131606435,91057207396,5300000,312532,26794702,91057207396,2133,2133,360029,33825,35000,36392,371,3,76639,17118392


### Are discrepancies due to loan type which is not accounted for?

In [44]:
# How about loan numbers, how do they vary from a naming standpoint?
# x[0]+x[1] if len(x) >2 else x[0] is such that it returns "v2-1.loan.fixed" from "v2-1.loan.fixed-32381", 
#    else returns "v2.loan.fixed.collection" from "v2.loan.fixed.collection-34479"

nftfi_not_in_mq.loan_no.astype(str).str.split('-').apply(lambda x: x[0]+'-'+x[1] if len(x) >2 else x[0]).unique()
# it seems from the above result that [v2-1.loan.fixed', 'v2.loan.fixed.collection'] are the two loan types which are not accounted for

array(['v2-1.loan.fixed', 'v2.loan.fixed.collection'], dtype=object)

In [45]:
# Is the above true as well for the whole table set?
nftfi_loans_not_in_mq = list(
        set(list(nftfi.loan_no_cleaned)) - set(list(mq.loan_id_cleaned))
    )
print(len(nftfi_loans_not_in_mq))
# How about loan numbers, how do they vary from a naming standpoint?
# x[0]+x[1] if len(x) >2 else x[0] is such that it returns "v2-1.loan.fixed" from "v2-1.loan.fixed-32381", 
#    else returns "v2.loan.fixed.collection" from "v2.loan.fixed.collection-34479"

nftfi_not_in_mq.loan_no.astype(str).str.split('-').apply(lambda x: x[0]+'-'+x[1] if len(x) >2 else x[0]).unique()
# it seems from the above result that [v2-1.loan.fixed', 'v2.loan.fixed.collection'] are the two loan types which are not accounted for

14989


array(['v2-1.loan.fixed', 'v2.loan.fixed.collection'], dtype=object)

### Is it due to missed erc20 token denomination?

In [46]:
# Check if it can be due to missing token
usdc_address = '0xA0b86991c6218b36c1d19D4a2e9Eb0cE3606eB48'  # https://etherscan.io/token/0xa0b86991c6218b36c1d19d4a2e9eb0ce3606eb48
usdt_address = '0xdAC17F958D2ee523a2206206994597C13D831ec7'  # https://etherscan.io/token/0xdac17f958d2ee523a2206206994597c13d831ec7
dai_address = '0x6B175474E89094C44Da98b954EedeAC495271d0F'  # https://etherscan.io/token/0x6b175474e89094c44da98b954eedeac495271d0f
weth_address = '0xC02aaA39b223FE8D0A0e5C4F27eAD9083C756Cc2'

stablecoin_addresses = [usdc_address, usdt_address, dai_address, weth_address]

stablecoin_names = ['usdc', 'usdt', 'dai', 'weth']
for stablecoin_address, stablecoin_name in zip(stablecoin_addresses, stablecoin_names):
    stablecoin_address = stablecoin_address.lower()
    nftfi_not_in_mq.loc[nftfi_not_in_mq['loan_erc20denomination'] == stablecoin_address, 'loan_erc20denomination_name'] = stablecoin_name

In [47]:
nftfi_not_in_mq.loan_erc20denomination_name.unique()
# It does not seem to be linked to missing token.

array(['weth', 'usdc', 'dai'], dtype=object)

### Let's compute loan volumes per token denomination to see if they match

In [48]:
display(april_nftfi.head(2))
display(april_mq.head(2))

Unnamed: 0,loan_no,id,loan_contract,status,borrower,lender,loan_principal_amount,maximum_repayment_amount,loan_duration_d,apr,loan_start_time,date,loan_erc20denomination,block_num,transaction_hash,gas_price,gas_limit,gas_used,cumulative_gas_used,effective_gas_price,repaid,liquidated,loan_repaid_time,repaid_amount_paid_to_lender,repaid_transaction_hash,repaid_gas_price,repaid_gas_limit,repaid_gas_used,repaid_cumulative_gas_used,repaid_effective_gas_price,repaid_admin_fee,loan_liquidation_date,liquidated_transaction_hash,liquidated_gas_price,liquidated_gas_limit,liquidated_gas_used,liquidated_cumulative_gas_used,liquidated_effective_gas_price,loan_no_cleaned,high,eth_price,usd_value,loan_erc20denomination_name,loan_type
37971,v2-1.loan.fixed-31044,31044,v2-1.loan.fixed,repaid,0x371267a1863080c5F39229183350e0D87d39743E,0x9CD074f0192BB2A477DA3271bA03db4fc5cD38c7,3,0,30,40,1970-01-01 00:00:01.680307511,2023-04-01 00:05:11+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,16950628,0x18c7c39e8fdb35cd976872d05263f92e34d9e8b5825c...,26393453389,539029,524441,5046898,26393453389,True,True,2023-04-24 09:17:59+00:00,2.6811851e+18,0xb0ca08e743122d22d09806ba5850cda85f605dee5bfc...,38753230709.0,454254.0,240516.0,2481228.0,38753230709.0,4272900000000000.0,,,,,,,,31044,1824,1823,4741,weth,v2-1.loan.fixed
37972,v2-1.loan.fixed-31045,31045,v2-1.loan.fixed,,0x07a2CF3c078D9526Eb50Ba7AFFaBc0049827D126,0x064980edD7D43AbEE781f49A4e31C06Df05EcccB,0,0,30,90,1970-01-01 00:00:01.680308543,2023-04-01 00:22:23+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,16950714,0xa9ba08c02d21f2431178b2daa9edb4e50416948373e8...,21761128223,466942,461954,9657250,21761128223,True,True,NaT,,,,,,,,,,,,,,,,31045,1828,1826,685,weth,v2-1.loan.fixed


Unnamed: 0,transaction_hash,block_timestamp,loan_id,to_address,from_address,principal_amount,repayment_amount,erc20_address,erc20_name,due_date,duration_in_days,apr,token_id,collection_address,protocol,amt_in_usd,roll_over,block_number,p2p_p2pool,loan_id_cleaned
2,0x0f3522aa06eb28b8cceb590ea80cbd335ab64010dab8...,2023-04-02 09:27:59.000000 UTC,31180,0xf7b18e107eb36797f4ce36de756630b9c30969ad,0x31d75becb2fe9cc60eb4877b44110aa1cdae90a5,800,826,0x6b175474e89094c44da98b954eedeac495271d0f,DAI,2023-06-01 09:27:59.000000 UTC,60,0,2118,0x026224a2940bfe258d0dbe947919b62fe321f042,nftfi,800,False,16960517,p2p,31180
28,0xecaf8a9e276b227506ebc8acc837792370ec83d52e39...,2023-04-28 00:40:35.000000 UTC,34311,0xefa755b82218dc287ed37bf6463c144ae6609076,0x08f6db921b10ce9f7ec4166b9be9dc01a30c34cc,10000,10082,0xa0b86991c6218b36c1d19d4a2e9eb0ce3606eb48,USDc,2023-05-28 00:40:35.000000 UTC,30,0,6096,0x059edd72cd353df5106d2b9cc5ab83a52287ac3a,nftfi,10000,False,17141128,p2p,34311


In [49]:
import warnings
warnings.simplefilter(action='ignore', category=FutureWarning)
pd.set_option('display.float_format', '{:,.2f}'.format)
display(april_nftfi.groupby('loan_erc20denomination_name').agg('sum'))

display(april_mq.groupby('erc20_name').agg('sum'))


Unnamed: 0_level_0,id,loan_principal_amount,maximum_repayment_amount,loan_duration_d,apr,block_num,gas_price,gas_limit,gas_used,cumulative_gas_used,effective_gas_price,repaid,liquidated,repaid_gas_price,repaid_gas_limit,repaid_gas_used,repaid_cumulative_gas_used,repaid_effective_gas_price,liquidated_gas_price,liquidated_gas_limit,liquidated_gas_used,liquidated_cumulative_gas_used,liquidated_effective_gas_price,high,eth_price,usd_value
loan_erc20denomination_name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1
dai,6594977,3350375.71,0.0,5968,6054.41,3458304699,6832966278316,103456648,100375684,2353757822,6832966278316,203,203,769162008701.0,10835521.0,5725645.0,190423346.0,769162008701.0,21235263805.0,335454.0,177159.0,6848085.0,21235263805.0,390801.69,390569.03,3350375.71
usdc,2453169,0.0,0.0,2640,3896.08,1278656120,2807403673316,39417988,38646194,991095083,2807403673316,75,75,186589305863.0,2599827.0,1376511.0,40229807.0,186589305863.0,0.0,0.0,0.0,0.0,0.0,146504.09,146396.44,0.0
weth,81252286,8183.79,0.0,72342,135582.41,42681789444,75483523412806,1254451253,1214026491,27876688741,75483523412806,2506,2506,16171127396980.0,188615897.0,99951744.0,2908004194.0,16171127396980.0,12010322373414.0,136823706.0,47499156.0,1678709938.0,12010322373414.0,4828052.68,4825026.23,15736525.8


Unnamed: 0_level_0,loan_id,principal_amount,repayment_amount,duration_in_days,apr,amt_in_usd,roll_over,block_number
erc20_name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
DAI,4191128,394685.88,405500.21,3675.0,42.73,394685.88,0,2182533702
USDc,1978300,451556.0,456643.87,1653.0,22.86,451556.0,0,1008723705
wETH,54665173,2977.71,3074.87,54582.0,812.65,5676459.91,0,28398510161


In [50]:

print("NFTfi:")
display(pd.DataFrame(april_nftfi.groupby('loan_erc20denomination_name').agg('sum')['loan_principal_amount']))
print("\n\nMQ:")
display(pd.DataFrame(april_mq.groupby('erc20_name').agg('sum')['principal_amount']))

NFTfi:


Unnamed: 0_level_0,loan_principal_amount
loan_erc20denomination_name,Unnamed: 1_level_1
dai,3350375.71
usdc,0.0
weth,8183.79




MQ:


Unnamed: 0_level_0,principal_amount
erc20_name,Unnamed: 1_level_1
DAI,394685.88
USDc,451556.0
wETH,2977.71


#### We see from the above results that NFTfi and MQ respective loan principal amounts grouped by the loan erc20 denomination do not match at all. How about the total dollar numbers?

In [51]:
print("NFTfi:")
total_usd_nftfi_volume_per_ccy = pd.DataFrame(april_nftfi.groupby('loan_erc20denomination_name').agg('sum')['usd_value'])
display(total_usd_nftfi_volume_per_ccy)
print("\n\nMQ:")
total_usd_mq_volume_per_ccy = pd.DataFrame(april_mq.groupby('erc20_name').agg('sum')['amt_in_usd'])
display(total_usd_mq_volume_per_ccy)

NFTfi:


Unnamed: 0_level_0,usd_value
loan_erc20denomination_name,Unnamed: 1_level_1
dai,3350375.71
usdc,0.0
weth,15736525.8




MQ:


Unnamed: 0_level_0,amt_in_usd
erc20_name,Unnamed: 1_level_1
DAI,394685.88
USDc,451556.0
wETH,5676459.91


#### Total numbers are very off. Can that be explained with the set of loans which are not in each dataset?

In [52]:
print("Total dollar value of loan principal for NFTfi loans which are not in MQ, for April and NFTfi:")
display(pd.DataFrame(nftfi_not_in_mq.groupby('loan_erc20denomination_name').agg('sum')['usd_value']))
print("\n\nTotal dollar value of loan principal for MQ loans which are not inNFtfi, for April and MQ:")
display(pd.DataFrame(mq_not_in_nftfi.groupby('erc20_name').agg('sum')['amt_in_usd']))

Total dollar value of loan principal for NFTfi loans which are not in MQ, for April and NFTfi:


Unnamed: 0_level_0,usd_value
loan_erc20denomination_name,Unnamed: 1_level_1
dai,3350375.71
usdc,0.0
weth,15736525.8




Total dollar value of loan principal for MQ loans which are not inNFtfi, for April and MQ:


Unnamed: 0_level_0,amt_in_usd
erc20_name,Unnamed: 1_level_1
DAI,394685.88
USDc,451556.0
wETH,5676459.91


In [53]:
usd_values_of_nftfi_not_in_mq = pd.DataFrame(nftfi_not_in_mq.groupby('loan_erc20denomination_name').agg('sum')['usd_value'])
usd_values_of_mq_not_in_nftfi = pd.DataFrame(mq_not_in_nftfi.groupby('erc20_name').agg('sum')['amt_in_usd'])

In [54]:
weth_usd_amount_nftfi_not_in_mq = usd_values_of_nftfi_not_in_mq.loc['weth'].values[0]
weth_usd_amount_mq_not_in_nftfi = usd_values_of_mq_not_in_nftfi.loc['wETH'].values[0]

weth_usd_amount_total_nftfi = total_usd_nftfi_volume_per_ccy.loc['weth'].values[0]
weth_usd_amount_total_mq = total_usd_mq_volume_per_ccy.loc['wETH'].values[0]

print(weth_usd_amount_total_nftfi, weth_usd_amount_nftfi_not_in_mq, weth_usd_amount_mq_not_in_nftfi, weth_usd_amount_total_mq)

# total NFTfi missing from MQ volume, minus total MQ volume missing from NFTfi

weth_usd_amount_nftfi_not_in_mq - weth_usd_amount_mq_not_in_nftfi - weth_usd_amount_total_nftfi  + weth_usd_amount_total_mq

15736525.796682782 15736525.796682782 5676459.911920467 5676459.911920467


0.0

#### How about dollar amounts PER loan type PER ccy?

In [55]:
usd_values_of_nftfi_not_in_mq = pd.DataFrame(nftfi_not_in_mq.groupby(['loan_erc20denomination_name','loan_type']).agg('sum')['usd_value'])
usd_values_of_nftfi_not_in_mq

Unnamed: 0_level_0,Unnamed: 1_level_0,usd_value
loan_erc20denomination_name,loan_type,Unnamed: 2_level_1
dai,v2-1.loan.fixed,1133987.41
dai,v2.loan.fixed.collection,2216388.29
usdc,v2-1.loan.fixed,0.0
usdc,v2.loan.fixed.collection,0.0
weth,v2-1.loan.fixed,6656293.63
weth,v2.loan.fixed.collection,9080232.17


In [56]:
print("NFTfi:")
display(total_usd_nftfi_volume_per_ccy)
print("\n\nMQ:")
display(total_usd_mq_volume_per_ccy)

NFTfi:


Unnamed: 0_level_0,usd_value
loan_erc20denomination_name,Unnamed: 1_level_1
dai,3350375.71
usdc,0.0
weth,15736525.8




MQ:


Unnamed: 0_level_0,amt_in_usd
erc20_name,Unnamed: 1_level_1
DAI,394685.88
USDc,451556.0
wETH,5676459.91


## For the loan IDs which do match... are they the same loans?

In [57]:
import copy
nftfi_with_col_prefix = copy.deepcopy(nftfi)
mq_with_col_prefix = copy.deepcopy(mq)
nftfi_with_col_prefix = nftfi_with_col_prefix.rename(columns={col: 'nftfi_'+ col for col in nftfi.columns})
mq_with_col_prefix = mq_with_col_prefix.rename(columns={col: 'mq_'+ col for col in mq.columns})

matching_mq_with_nftfi = pd.merge(left=nftfi_with_col_prefix, right=mq_with_col_prefix, left_on='nftfi_loan_no_cleaned', right_on='mq_loan_id_cleaned', how='inner', suffixes=('nftfi', 'mq'))
matching_mq_with_nftfi

Unnamed: 0,nftfi_loan_no,nftfi_id,nftfi_loan_contract,nftfi_status,nftfi_borrower,nftfi_lender,nftfi_loan_principal_amount,nftfi_maximum_repayment_amount,nftfi_loan_duration_d,nftfi_apr,nftfi_loan_start_time,nftfi_date,nftfi_loan_erc20denomination,nftfi_block_num,nftfi_transaction_hash,nftfi_gas_price,nftfi_gas_limit,nftfi_gas_used,nftfi_cumulative_gas_used,nftfi_effective_gas_price,nftfi_repaid,nftfi_liquidated,nftfi_loan_repaid_time,nftfi_repaid_amount_paid_to_lender,nftfi_repaid_transaction_hash,nftfi_repaid_gas_price,nftfi_repaid_gas_limit,nftfi_repaid_gas_used,nftfi_repaid_cumulative_gas_used,nftfi_repaid_effective_gas_price,nftfi_repaid_admin_fee,nftfi_loan_liquidation_date,nftfi_liquidated_transaction_hash,nftfi_liquidated_gas_price,nftfi_liquidated_gas_limit,nftfi_liquidated_gas_used,nftfi_liquidated_cumulative_gas_used,nftfi_liquidated_effective_gas_price,nftfi_loan_no_cleaned,nftfi_high,nftfi_eth_price,nftfi_usd_value,nftfi_loan_erc20denomination_name,nftfi_loan_type,mq_transaction_hash,mq_block_timestamp,mq_loan_id,mq_to_address,mq_from_address,mq_principal_amount,mq_repayment_amount,mq_erc20_address,mq_erc20_name,mq_due_date,mq_duration_in_days,mq_apr,mq_token_id,mq_collection_address,mq_protocol,mq_amt_in_usd,mq_roll_over,mq_block_number,mq_p2p_p2pool,mq_loan_id_cleaned
0,v1.loan.fixed-1,1,v1.loan.fixed,repaid,0xc35A5FEc6BE6957899E15559Be252Db882220b37,0x44DdF3e35Cd2D629d78674FF6BF5b953e2B069fe,0.00,0.00,7,173.81,1970-01-01 00:00:01.589623507,2020-05-16 10:05:07+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,10076484,0x937a5320404c0c835f2739c84b229ef837a9f0b0ef92...,19755020080,500000,441106,9710213,19755020080,True,True,2020-05-16 11:50:26+00:00,3095000000000000,0x59d1c26160b7bdde716b380364b506e056d852ac1b36...,16974493487.00,500000.00,122603.00,9470068.00,16974493487.00,5000000000000,,,,,,,,1,,,,weth,v1.loan.fixed,0x166d57a868ae6c3e34c192546aedc243eda0c7ba6685...,2022-03-30 10:21:32.000000 UTC,1,0x3e3b47b5d433be4708a6bd524facd48bb54d10b1,0xd79275564ccad8e679cbbb5e1c2facd46643a372,0.01,0.01,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-04-13 10:21:32.000000 UTC,14.00,0.10,1000323,0x059edd72cd353df5106d2b9cc5ab83a52287ac3a,nftfi,33.89,False,14487024,p2p,1
1,v2.loan.fixed-1,1,v2.loan.fixed,repaid,0x3e3B47b5d433bE4708A6BD524faCd48Bb54D10b1,0xd79275564CCAd8E679cbBb5E1C2FaCD46643a372,0.01,0.00,14,9.91,1970-01-01 00:00:01.648635692,2022-03-30 10:21:32+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,14487024,0x166d57a868ae6c3e34c192546aedc243eda0c7ba6685...,33892599088,840378,540864,5140379,33892599088,True,True,2022-03-30 10:27:49+00:00,10036100000000000,0xed765e1584d0588c100167ea8614e54681ac7b525fb0...,28938564954.00,471039.00,249468.00,9338789.00,28938564954.00,1900000000000,,,,,,,,1,3396.32,3394.93,33.95,weth,v2.loan.fixed,0x166d57a868ae6c3e34c192546aedc243eda0c7ba6685...,2022-03-30 10:21:32.000000 UTC,1,0x3e3b47b5d433be4708a6bd524facd48bb54d10b1,0xd79275564ccad8e679cbbb5e1c2facd46643a372,0.01,0.01,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-04-13 10:21:32.000000 UTC,14.00,0.10,1000323,0x059edd72cd353df5106d2b9cc5ab83a52287ac3a,nftfi,33.89,False,14487024,p2p,1
2,v1.loan.fixed-2,2,v1.loan.fixed,repaid,0x44DdF3e35Cd2D629d78674FF6BF5b953e2B069fe,0xc35A5FEc6BE6957899E15559Be252Db882220b37,0.03,0.00,7,17.38,1970-01-01 00:00:01.589628655,2020-05-16 11:30:55+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,10076867,0xf331e9fb8341f1b644e0edfe599a56402836808b2570...,12100000000,500000,403060,9269753,12100000000,True,True,2020-05-16 12:20:16+00:00,30095000000000000,0xfa036df32071d8b4f301b34aa2893bc0499db7e79bf1...,13200000144.00,500000.00,132834.00,4140219.00,13200000144.00,5000000000000,,,,,,,,2,,,,weth,v1.loan.fixed,0x9d783e3bbde1663ffa2dcc0bf5eabeccbe3f58475938...,2022-03-30 10:36:00.000000 UTC,2,0x3e3b47b5d433be4708a6bd524facd48bb54d10b1,0xd79275564ccad8e679cbbb5e1c2facd46643a372,0.01,0.01,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-04-13 10:36:00.000000 UTC,14.00,0.10,735355,0x06012c8cf97bead5deae237070f9587f8e7a266d,nftfi,33.89,False,14487091,p2p,2
3,v2.loan.fixed-2,2,v2.loan.fixed,repaid,0x3e3B47b5d433bE4708A6BD524faCd48Bb54D10b1,0xd79275564CCAd8E679cbBb5E1C2FaCD46643a372,0.01,0.00,14,9.91,1970-01-01 00:00:01.648636560,2022-03-30 10:36:00+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,14487091,0x9d783e3bbde1663ffa2dcc0bf5eabeccbe3f58475938...,24769994524,757849,490645,7281728,24769994524,True,True,2022-03-30 10:36:56+00:00,10036100000000000,0x2d6415762da5c2fc90dcfd4a7f0c19e30c57b45ae480...,30247267592.00,398226.00,210634.00,16058990.00,30247267592.00,1900000000000,,,,,,,,2,3398.36,3397.60,33.98,weth,v2.loan.fixed,0x9d783e3bbde1663ffa2dcc0bf5eabeccbe3f58475938...,2022-03-30 10:36:00.000000 UTC,2,0x3e3b47b5d433be4708a6bd524facd48bb54d10b1,0xd79275564ccad8e679cbbb5e1c2facd46643a372,0.01,0.01,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-04-13 10:36:00.000000 UTC,14.00,0.10,735355,0x06012c8cf97bead5deae237070f9587f8e7a266d,nftfi,33.89,False,14487091,p2p,2
4,v1.loan.fixed-3,3,v1.loan.fixed,repaid,0xc35A5FEc6BE6957899E15559Be252Db882220b37,0x44DdF3e35Cd2D629d78674FF6BF5b953e2B069fe,0.00,0.00,7,17.38,1970-01-01 00:00:01.589631935,2020-05-16 12:25:35+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,10077100,0x330e8f56d4f6eb07392d8c23858eda1cada42c550ed9...,15430188679,500000,428215,2708977,15430188679,True,True,2020-05-16 12:28:51+00:00,3009500000000000,0x8f70de246186ae66da45404c856b9db431b26bfcbe7f...,13100000072.00,500000.00,122603.00,9570320.00,13100000072.00,500000000000,,,,,,,,3,,,,weth,v1.loan.fixed,0x7d7682a9827b44571da3bdc1f7342d9ad3c985e7aedb...,2022-03-30 10:43:05.000000 UTC,3,0x3e3b47b5d433be4708a6bd524facd48bb54d10b1,0xd79275564ccad8e679cbbb5e1c2facd46643a372,0.01,0.01,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2022-03-30 10:50:17.000000 UTC,0.01,0.73,1000323,0x059edd72cd353df5106d2b9cc5ab83a52287ac3a,nftfi,33.89,False,14487122,p2p,3
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
28024,v2-1.loan.fixed-33808,33808,v2-1.loan.fixed,,0xB2A2a6a69E7A0aD66943F4c2869d45A9919CF740,0xF4Fb9FA23edB32215E5284cf7dBfDB5607d51a5b,1.25,0.00,60,39.00,1970-01-01 00:00:01.682357939,2023-04-24 17:38:59+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,17117683,0x2573d462a1e5bc8c7085f18a317dee42c6003e86e40b...,60758034730,533673,514285,11129095,60758034730,True,True,NaT,,,,,,,,,,,,,,,,33808,1834.86,1834.07,2292.59,weth,v2-1.loan.fixed,0x2573d462a1e5bc8c7085f18a317dee42c6003e86e40b...,2023-04-24 17:38:59.000000 UTC,33808,0xb2a2a6a69e7a0ad66943f4c2869d45a9919cf740,0xf4fb9fa23edb32215e5284cf7dbfdb5607d51a5b,1.25,1.33,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2023-06-23 17:38:59.000000 UTC,60.00,0.39,2496,0x42069abfe407c60cf4ae4112bedead391dba1cdb,nftfi,2267.92,False,17117683,p2p,33808
28025,v2-1.loan.fixed-33809,33809,v2-1.loan.fixed,,0xB2A2a6a69E7A0aD66943F4c2869d45A9919CF740,0xF4Fb9FA23edB32215E5284cf7dBfDB5607d51a5b,1.20,0.00,60,39.00,1970-01-01 00:00:01.682358287,2023-04-24 17:44:47+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,17117712,0x182b91443edf0fdcdf9210e2792a1475d6c47f9e8175...,51243960438,543473,528885,18678811,51243960438,True,True,NaT,,,,,,,,,,,,,,,,33809,1838.06,1834.08,2200.90,weth,v2-1.loan.fixed,0x182b91443edf0fdcdf9210e2792a1475d6c47f9e8175...,2023-04-24 17:44:47.000000 UTC,33809,0xb2a2a6a69e7a0ad66943f4c2869d45a9919cf740,0xf4fb9fa23edb32215e5284cf7dbfdb5607d51a5b,1.20,1.28,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2023-06-23 17:44:47.000000 UTC,60.00,0.39,1044,0x42069abfe407c60cf4ae4112bedead391dba1cdb,nftfi,2177.20,False,17117712,p2p,33809
28026,v2-1.loan.fixed-33810,33810,v2-1.loan.fixed,,0xB2A2a6a69E7A0aD66943F4c2869d45A9919CF740,0xF4Fb9FA23edB32215E5284cf7dBfDB5607d51a5b,1.20,0.00,60,39.00,1970-01-01 00:00:01.682358299,2023-04-24 17:44:59+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,17117713,0x97b46e05a3d4e573b0cd59df2657c5478081e6a4d12f...,55397766781,533653,514265,6290372,55397766781,True,True,NaT,,,,,,,,,,,,,,,,33810,1838.06,1834.08,2200.90,weth,v2-1.loan.fixed,0x97b46e05a3d4e573b0cd59df2657c5478081e6a4d12f...,2023-04-24 17:44:59.000000 UTC,33810,0xb2a2a6a69e7a0ad66943f4c2869d45a9919cf740,0xf4fb9fa23edb32215e5284cf7dbfdb5607d51a5b,1.20,1.28,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2023-06-23 17:44:59.000000 UTC,60.00,0.39,4770,0x42069abfe407c60cf4ae4112bedead391dba1cdb,nftfi,2177.20,False,17117713,p2p,33810
28027,v2-1.loan.fixed-33824,33824,v2-1.loan.fixed,,0x353D1aF0fA732F6230Ff4ab0eB2a6A3Dcf4C54F2,0x1797b4235473fbE0e7e44322F01C1B5618EBda41,7.00,0.00,365,9.00,1970-01-01 00:00:01.682364971,2023-04-24 19:36:11+00:00,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,17118262,0x862834c19fc5e3255d85ee631d45b38c210055fb8aa8...,55983293990,528871,509483,9778066,55983293990,True,True,NaT,,,,,,,,,,,,,,,,33824,1832.78,1832.01,12824.07,weth,v2-1.loan.fixed,0x862834c19fc5e3255d85ee631d45b38c210055fb8aa8...,2023-04-24 19:36:11.000000 UTC,33824,0x353d1af0fa732f6230ff4ab0eb2a6a3dcf4c54f2,0x1797b4235473fbe0e7e44322f01c1b5618ebda41,7.00,7.63,0xc02aaa39b223fe8d0a0e5c4f27ead9083c756cc2,wETH,2024-04-23 19:36:11.000000 UTC,365.00,0.09,3903,0x059edd72cd353df5106d2b9cc5ab83a52287ac3a,nftfi,12820.53,False,17118262,p2p,33824


In [58]:
subset_of_matching_mq_with_nftfi = matching_mq_with_nftfi[['nftfi_date', 'mq_block_timestamp', 'nftfi_usd_value', 'mq_amt_in_usd', 'nftfi_loan_no_cleaned', 'nftfi_loan_type', 'mq_loan_id_cleaned']]
subset_of_matching_mq_with_nftfi

Unnamed: 0,nftfi_date,mq_block_timestamp,nftfi_usd_value,mq_amt_in_usd,nftfi_loan_no_cleaned,nftfi_loan_type,mq_loan_id_cleaned
0,2020-05-16 10:05:07+00:00,2022-03-30 10:21:32.000000 UTC,,33.89,1,v1.loan.fixed,1
1,2022-03-30 10:21:32+00:00,2022-03-30 10:21:32.000000 UTC,33.95,33.89,1,v2.loan.fixed,1
2,2020-05-16 11:30:55+00:00,2022-03-30 10:36:00.000000 UTC,,33.89,2,v1.loan.fixed,2
3,2022-03-30 10:36:00+00:00,2022-03-30 10:36:00.000000 UTC,33.98,33.89,2,v2.loan.fixed,2
4,2020-05-16 12:25:35+00:00,2022-03-30 10:43:05.000000 UTC,,33.89,3,v1.loan.fixed,3
...,...,...,...,...,...,...,...
28024,2023-04-24 17:38:59+00:00,2023-04-24 17:38:59.000000 UTC,2292.59,2267.92,33808,v2-1.loan.fixed,33808
28025,2023-04-24 17:44:47+00:00,2023-04-24 17:44:47.000000 UTC,2200.90,2177.20,33809,v2-1.loan.fixed,33809
28026,2023-04-24 17:44:59+00:00,2023-04-24 17:44:59.000000 UTC,2200.90,2177.20,33810,v2-1.loan.fixed,33810
28027,2023-04-24 19:36:11+00:00,2023-04-24 19:36:11.000000 UTC,12824.07,12820.53,33824,v2-1.loan.fixed,33824


In [59]:
pd.options.plotting.backend = "plotly"
subset_of_matching_mq_with_nftfi['dollar_diff'] = subset_of_matching_mq_with_nftfi['nftfi_usd_value'] - subset_of_matching_mq_with_nftfi['mq_amt_in_usd']

subset_of_matching_mq_with_nftfi.nftfi_date = pd.to_datetime(subset_of_matching_mq_with_nftfi.nftfi_date)
subset_of_matching_mq_with_nftfi.mq_block_timestamp = pd.to_datetime(subset_of_matching_mq_with_nftfi.mq_block_timestamp)

subset_of_matching_mq_with_nftfi.plot.scatter(x=subset_of_matching_mq_with_nftfi.nftfi_date, y=subset_of_matching_mq_with_nftfi.dollar_diff)

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  subset_of_matching_mq_with_nftfi['dollar_diff'] = subset_of_matching_mq_with_nftfi['nftfi_usd_value'] - subset_of_matching_mq_with_nftfi['mq_amt_in_usd']
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  subset_of_matching_mq_with_nftfi.nftfi_date = pd.to_datetime(subset_of_matching_mq_with_nftfi.nftfi_date)
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/use

ValueError: Mime type rendering requires nbformat>=4.2.0 but it is not installed

In [None]:
subset_of_matching_mq_with_nftfi['date_diff'] = subset_of_matching_mq_with_nftfi['nftfi_date'] - subset_of_matching_mq_with_nftfi['mq_block_timestamp']
subset_of_matching_mq_with_nftfi.plot.scatter(x=subset_of_matching_mq_with_nftfi.nftfi_date, y=subset_of_matching_mq_with_nftfi.date_diff)

In [None]:
import numpy as np
subset_of_matching_mq_with_nftfi['date_diff'] = subset_of_matching_mq_with_nftfi['nftfi_date'] - subset_of_matching_mq_with_nftfi['mq_block_timestamp']
non_zero_time_delta = subset_of_matching_mq_with_nftfi.loc[subset_of_matching_mq_with_nftfi['date_diff'] > np.timedelta64(0)]
display(non_zero_time_delta)
display(non_zero_time_delta.nftfi_loan_type.unique())

print(f"min, max nftfi [{non_zero_time_delta.nftfi_date.min(), non_zero_time_delta.nftfi_date.max()}]")
print(f"min, max mq [{non_zero_time_delta.mq_block_timestamp.min(), non_zero_time_delta.mq_block_timestamp.max()}]")

print(f"\n\nTotal dollar diff for non zero time deltas (IDs not matching) [{non_zero_time_delta.dollar_diff.sum()}]")
print(f"Total dollar diff for both datasets [{subset_of_matching_mq_with_nftfi.dollar_diff.sum()}]")

In [None]:
nftfi.date = pd.to_datetime(nftfi.date)
time_delta = pd.Timedelta(minutes=20)
datemax_minus_time_delta = non_zero_time_delta.nftfi_date.max() - time_delta
datemax_plus_time_delta = non_zero_time_delta.nftfi_date.max() + time_delta

print(non_zero_time_delta.nftfi_date.max())
nftfi.loc[nftfi.date < datemax_plus_time_delta].loc[datemax_minus_time_delta < nftfi.date].sort_values('date')

In [None]:
non_zero_time_delta.loc[non_zero_time_delta['dollar_diff'] == 0]

### Are missing loans from MQ relative to NFTfi, bundles?

In [None]:
display(nftfi_not_in_mq.collection_name.unique())
len(nftfi_not_in_mq.collection_name.unique())

In [None]:
display(mq_not_in_nftfi.collection_address.unique()[:3])
len(mq_not_in_nftfi.collection_address.unique())

## How are liquidations accounted for?

In [None]:
# TODO:
# spreadsheet of different transactions that are missing, or are more of them on MQ dataset. we need clear doc discussing which tsx are missing, which are added,
# what are the volume differences coming from.

# try and check that the eth value of those loans per transaction is the same.
# check if volumes per loanerc20 collateral are matching

## Sandbox

In [None]:
try: 
    volume = pd.read_csv('analysis/nftfi_cluster_data/3month_200apr_with_borrow_volume.csv')
    base_data = pd.read_csv('analysis/nftfi_cluster_data/20230522_CADLabs_NFTfi NFT collection APR ranges_vDraft - past 3M; loan count 20; APRs 200; 5 clusters.csv')
except FileNotFoundError:
    volume = (
        pd.read_csv('nftfi_cluster_data/3month_200apr_with_borrow_volume.csv')
        .drop(columns=['mean', 'median', 'std', 'count'])
    )
    base_data = (
        pd.read_csv('nftfi_cluster_data/20230522_CADLabs_NFTfi NFT collection APR ranges_vDraft - past 3M; loan count 20; APRs 200; 5 clusters.csv')
        .drop(columns=['Unnamed: 0', 'Unnamed: 7', 'Unnamed: 8'])
    )

In [None]:
display(volume.head(2))
display(base_data.head(2))

In [None]:
nftfi = pd.merge(left=base_data, right=volume, on='collection_name')
nftfi 
# list(nftfi['borrow_volume'].values)