aboutsummaryrefslogtreecommitdiffstats
path: root/python/experiments/test_dask.py
blob: b790f9b4feb38d1774416472b6b6292fecb8355f (plain)
1
2
3
4
5
6
7
8
import dask.dataframe as dd
converters = {f'Spread{t}': lambda s: float(s.rstrip('%'))/100 if s else np.nan \
              for t in ['6m'] + [f'{y}y' for y in [1, 2, 3, 4, 5, 7, 10, 15, 20, 30]]}
df = dd.read_csv("*.csv", skiprows=2, converters=converters,
                 dtype={'CompositeLevel4y': 'object', 'Rating4y': 'object',
                        'CompositeDepth5y': 'object', 'AvRating': 'object',
                        'ImpliedRating':'object'},
                 parse_dates=['Date'])