import csv
import datetime
import logging
import numpy as np
import pandas as pd
import os

from collections import defaultdict
from itertools import chain
from pandas.tseries.offsets import BDay

# Module-level logger, named after this module via ``__name__``.
logger = logging.getLogger(__name__)


def convert(x):
    """Parse a numeric string that carries a one-character suffix.

    The last character of *x* is dropped unconditionally before parsing
    (``"12.5%"`` -> ``12.5``); it is not checked to be a ``%`` sign.

    :param x: string to parse, or None (``csv.DictReader`` yields None for
        fields missing from a short row).
    :returns: the parsed float, or None when *x* is None or when the
        remaining text is not a valid number (this includes the empty
        string).
    """
    if x is None:
        # A missing field is treated like an unparseable one instead of
        # failing with TypeError on the slice below.
        return None
    try:
        return float(x[:-1])
    except ValueError:
        return None


def get_index_list(database, workdate):
    """Yield the index names selected from ``index_maturity`` for *workdate*.

    A row qualifies when its ``issue_date`` is set and not later than
    ``workdate + 10`` (presumably days -- confirm against the column type)
    and its ``maturity`` is on or after *workdate*.  Each yielded name is the
    ``index`` value followed by the string form of ``series``.

    This is a generator: the query runs on first iteration and
    ``database.commit()`` is only reached once the generator is exhausted.

    :param database: connection object providing ``cursor()`` and ``commit()``.
    :param workdate: reference date passed twice to the query.
    """
    query = (
        "SELECT distinct index, series FROM index_maturity "
        "WHERE issue_date IS NOT NULL and issue_date <= %s + 10 "
        "AND maturity >= %s"
    )
    with database.cursor() as cur:
        cur.execute(query, (workdate, workdate))
        for row in cur:
            index_name, series_number = row
            yield index_name + str(series_number)
    database.commit()


# Doc-clause label -> short code.
# NOTE(review): the last label is exactly 30 characters long and looks
# truncated; presumably it matches the text as it appears in the source
# data -- confirm before "correcting" the spelling.
DOC_CLAUSE_MAPPING = {
    "Full Restructuring": "MM",
    "No Restructuring": "XR",
    "Modified Modified Restructurin": "MM",
}

# Same labels as above, with "14" appended to every short code.
DOC_CLAUSE_MAPPING14 = {
    label: code + "14" for label, code in DOC_CLAUSE_MAPPING.items()
}


def get_markit_bbg_mapping(database, basketid_list, workdate):
    """Collect the Markit tickers of the given baskets and their curves.

    Queries ``historical_cds_issuers(workdate)`` joined with
    ``basket_constituents`` for the baskets in *basketid_list*.

    :param database: connection object providing ``cursor()`` and
        ``commit()``; rows must expose their columns as attributes.
    :param basketid_list: iterable of basket ids; it is materialised with
        ``list()`` when the query is executed.
    :param workdate: date passed to ``historical_cds_issuers``.
    :returns: a pair ``(tickers, mapping)`` where ``tickers`` is the set of
        ``(markit_ticker, markit_tier)`` pairs seen and ``mapping`` is a
        ``defaultdict(set)`` keyed by ``(markit_ticker, markit_tier,
        currency, short_code, spread / 10000)`` whose values are sets of
        ``cds_curve`` tuples.
    """
    query = (
        "SELECT markit_ticker, markit_tier, spread, currency, cds_curve, "
        " short_code FROM historical_cds_issuers(%s) "
        "JOIN basket_constituents USING (company_id, seniority) "
        "WHERE basketid=ANY(%s)"
    )
    tickers = set()
    curves_by_key = defaultdict(set)
    with database.cursor() as cur:
        cur.execute(query, (workdate, list(basketid_list)))
        for row in cur:
            ticker_and_tier = (row.markit_ticker, row.markit_tier)
            tickers.add(ticker_and_tier)
            key = ticker_and_tier + (
                row.currency,
                row.short_code,
                float(row.spread) / 10000,
            )
            # One Markit ticker can map to several Bloomberg tickers.  Those
            # may carry different curves (fine) or the very same curve (not
            # fine, because (date, curve_ticker) has to be unique), so the
            # curves are kept in a set to collapse duplicates.
            curves_by_key[key].add(tuple(row.cds_curve))
    database.commit()
    return (tickers, curves_by_key)


def get_bbg_tickers(database, basketid_list, workdate):
    """Yield every element of the distinct ``cds_curve`` values of the baskets.

    Each result row holds one ``cds_curve`` value in its first column; that
    value is iterated and its elements are yielded one by one.

    This is a generator: ``database.commit()`` is only reached once it has
    been exhausted.

    :param database: connection object providing ``cursor()`` and ``commit()``.
    :param basketid_list: iterable of basket ids, materialised with ``list()``.
    :param workdate: date passed to ``historical_cds_issuers``.
    """
    query = (
        "SELECT distinct cds_curve FROM historical_cds_issuers(%s) "
        "JOIN basket_constituents USING(company_id, seniority) "
        "WHERE basketid=ANY(%s)"
    )
    with database.cursor() as cur:
        cur.execute(query, (workdate, list(basketid_list)))
        for row in cur:
            yield from row[0]
    database.commit()


def get_basketids(database, index_list, workdate):
    """Yield the first column of ``nameToBasketID(index, workdate)`` per index.

    One query is executed for each element of *index_list*, all on the same
    cursor.  This is a generator: ``database.commit()`` is only reached once
    it has been exhausted.

    :param database: connection object providing ``cursor()`` and ``commit()``.
    :param index_list: iterable of index names.
    :param workdate: date passed as second argument of ``nameToBasketID``.
    """
    query = "SELECT * FROM nameToBasketID(%s, %s)"
    with database.cursor() as cur:
        for index_name in index_list:
            cur.execute(query, (index_name, workdate))
            first_row = cur.fetchone()
            yield first_row[0]
    database.commit()


def get_current_tickers(database, workdate):
    """Return the Markit ticker set and curve mapping for *workdate*.

    Chains :func:`get_index_list`, :func:`get_basketids` and
    :func:`get_markit_bbg_mapping`.  The first two are generators and are
    consumed only when the last one materialises the basket ids.

    :param database: connection object handed to all three helpers.
    :param workdate: date handed to all three helpers.
    :returns: whatever :func:`get_markit_bbg_mapping` returns.
    """
    return get_markit_bbg_mapping(
        database,
        get_basketids(database, get_index_list(database, workdate), workdate),
        workdate,
    )


def insert_cds(database, workdate):
    """Insert Markit single-name CDS quotes for *workdate* into ``cds_quotes``.

    Reads ``$BASE_DIR/Tranche_data/CDS/cds eod YYYYMMDD.csv``.  A CSV row is
    used when its ``(Ticker, Tier, Ccy, DocClause, RunningCoupon)`` tuple is
    a key of the mapping returned by :func:`get_current_tickers`.  For each
    curve tuple mapped to that key, the upfront columns (``Upfront6m`` ...
    ``Upfront10y``) are paired positionally with the curve tickers and one
    row is inserted per pair; existing rows are left untouched
    (``ON CONFLICT DO NOTHING``).

    Bid and ask are both filled from the same value (the upfront column and
    ``RunningCoupon * 10000`` respectively).  ``recovery`` is
    ``RealRecovery / 100``, or NULL when that field cannot be parsed.

    A warning listing the expected ``(ticker, tier)`` pairs that had no
    matching CSV row is logged when there is at least one.

    :param database: psycopg2 connection to the database.
    :param workdate: date of the quotes; also selects the input file.
    :raises KeyError: if ``BASE_DIR`` is not set or an expected CSV column
        is absent.
    :raises OSError: if the input file cannot be opened.
    """

    all_tickers, markit_bbg_mapping = get_current_tickers(database, workdate)
    filename = "cds eod {0:%Y%m%d}.csv".format(workdate)
    colnames = [
        "Upfront" + tenor for tenor in ["6m", "1y", "2y", "3y", "4y", "5y", "7y", "10y"]
    ]
    sqlstr = (
        "INSERT INTO cds_quotes(date, curve_ticker, upfrontbid, upfrontask,"
        "runningbid, runningask, source, recovery) VALUES(%s, %s, %s, %s, %s, %s, %s, %s) "
        "ON CONFLICT DO NOTHING"
    )

    tickers_found = set()
    path = os.path.join(os.environ["BASE_DIR"], "Tranche_data", "CDS", filename)
    # The csv module asks for files opened with newline="" so that it can
    # handle line endings (including ones embedded in quoted fields) itself.
    with open(path, newline="") as fh:
        csvreader = csv.DictReader(fh)
        with database.cursor() as c:
            for line in csvreader:
                spread = float(line["RunningCoupon"])
                k = (
                    line["Ticker"],
                    line["Tier"],
                    line["Ccy"],
                    line["DocClause"],
                    spread,
                )
                if k not in markit_bbg_mapping:
                    continue

                # Values shared by every row inserted for this CSV line.
                running = spread * 10000
                recovery = convert(line["RealRecovery"])
                if recovery is not None:
                    # convert() returns None for blank/invalid text; keep
                    # that as NULL instead of failing on ``None / 100``.
                    recovery = recovery / 100

                for curves in markit_bbg_mapping[k]:
                    rows = []
                    # zip stops at the shorter sequence, so only as many
                    # upfront columns are read as there are curve tickers.
                    for col, t in zip(colnames, curves):
                        upfront = convert(line[col])
                        rows.append(
                            (
                                workdate,
                                t,
                                upfront,
                                upfront,
                                running,
                                running,
                                "MKIT",
                                recovery,
                            )
                        )
                    c.executemany(sqlstr, rows)
                tickers_found.add((line["Ticker"], line["Tier"]))
        database.commit()

    missing = all_tickers - tickers_found
    if missing:
        logger.warning("missing_quotes for {0}".format(missing))


def get_date(f):
    """Return the date stored in the first field of the fourth line of *f*.

    The first three lines are skipped.  The text of the fourth line up to
    its first comma is taken, its first and last characters are dropped
    (presumably the surrounding quotes) and the rest is parsed with the
    ``%d-%b-%y`` format.

    :param f: path of the file to read.
    :returns: a ``datetime.date``.
    :raises StopIteration: if the file has fewer than four lines.
    :raises ValueError: if the extracted text does not match the format.
    """
    with open(f) as fh:
        for _ in range(3):
            next(fh)
        fourth_line = next(fh)
    first_field = fourth_line.partition(",")[0]
    date_text = first_field[1:-1]
    parsed = datetime.datetime.strptime(date_text, "%d-%b-%y")
    return parsed.date()


def insert_index(engine, workdate=None):
    """Insert Markit index composite quotes into ``index_quotes_pre``.

    Scans ``$BASE_DIR/Tranche_data/Composite_reports`` for files whose name
    contains ``Indices``, groups them by the date read from each file with
    :func:`get_date`, and loads the files of one single date.

    For every loaded file: rows without a composite price are dropped, the
    four price/spread columns are stripped of ``%`` and converted to float,
    the tenor is lower-cased and suffixed with ``r``, index names are mapped
    to their short codes (rows with any other name are dropped), both spread
    columns are multiplied by 100 and the source is set to ``MKIT``.

    :param engine: sqlalchemy engine to the database
    :param workdate: date whose files are loaded.  A ``datetime`` (which
        includes ``pd.Timestamp``) is reduced to its calendar date, since
        the files are keyed by ``datetime.date``.  If None, the files of the
        most recent date found are loaded.
    :raises KeyError: if no file carries *workdate* (or ``BASE_DIR`` is
        not set).
    :raises ValueError: if *workdate* is None and no matching file exists.
    """

    basedir = os.path.join(os.environ["BASE_DIR"], "Tranche_data", "Composite_reports")
    filenames = [
        os.path.join(basedir, f) for f in os.listdir(basedir) if "Indices" in f
    ]

    name_mapping = {
        "CDXNAHY": "HY",
        "CDXNAIG": "IG",
        "iTraxx Eur": "EU",
        "iTraxx Eur Xover": "XO",
    }
    cols = ["close_price", "close_spread", "model_price", "model_spread"]
    colmapping = {
        "Date": "date",
        "Name": "index",
        "Series": "series",
        "Version": "version",
        "Term": "tenor",
        "Composite Price": "close_price",
        "Composite Spread": "close_spread",
        "Model Price": "model_price",
        "Model Spread": "model_spread",
    }
    ext_cols = ["date", "index", "series", "version", "tenor"] + cols + ["source"]

    # A plain dict (not a defaultdict) so that an unknown workdate still
    # raises KeyError below instead of silently loading nothing.
    dates_to_files = {}
    for f in filenames:
        dates_to_files.setdefault(get_date(f), []).append(f)

    if workdate is None:
        filenames = dates_to_files[max(dates_to_files)]
    else:
        if isinstance(workdate, datetime.datetime):
            # A datetime never compares equal to a date, so it could never
            # match a key produced by get_date().
            workdate = workdate.date()
        filenames = dates_to_files[workdate]

    for f in filenames:
        data = pd.read_csv(f, skiprows=2, parse_dates=[0, 7], engine="python")
        data = data.rename(columns=colmapping)
        data = data.dropna(subset=["close_price"])
        for col in cols:
            data[col] = data[col].str.replace("%", "").astype("float")
        data["tenor"] = data["tenor"].apply(lambda x: x.lower() + "r")
        # np.nan rather than np.NaN: the latter alias was removed in NumPy 2.0.
        data["index"] = data["index"].apply(lambda x: name_mapping.get(x, np.nan))
        data = data.dropna(subset=["index"])
        data["close_spread"] *= 100
        data["model_spread"] *= 100
        ## we renumbered the version for HY9, 10 and 11
        # The "index" column must be selected with brackets: ``data.index``
        # is the DataFrame's row index, so comparing it with "HY" never
        # matched and the renumbering was silently skipped.
        renumbered = data["series"].isin([9, 10, 11]) & (data["index"] == "HY")
        data.loc[renumbered, "version"] -= 3
        # data = data.groupby(['index', 'series', 'tenor', 'date'], as_index=False).last()
        data["source"] = "MKIT"
        data[ext_cols].to_sql(
            "index_quotes_pre", engine, if_exists="append", index=False
        )


def insert_tranche(engine, workdate=None):
    """Insert Markit tranche composite quotes into ``markit_tranche_quotes``.

    Looks in ``$BASE_DIR/Tranche_data/Composite_reports`` for files whose
    name starts with ``Tranche Composites``.  Each selected file is read,
    its columns are renamed, attach/detach are multiplied by 100, the
    tranche spread by 10000, the tenor is lower-cased and suffixed with
    ``r``, and the rows are joined with the ``index_version`` table on
    ``redindexcode`` before being appended to the target table.

    :param engine: sqlalchemy engine to the database
    :param workdate: when given, only files whose modification date equals
        the business day following *workdate* are loaded.  If None, every
        matching file is loaded.
    :type workdate: pd.Timestamp
    """

    basedir = os.path.join(os.environ["BASE_DIR"], "Tranche_data", "Composite_reports")
    paths = [
        os.path.join(basedir, name)
        for name in os.listdir(basedir)
        if name.startswith("Tranche Composites")
    ]
    renames = {
        "Date": "quotedate",
        "Index Term": "tenor",
        "Attachment": "attach",
        "Detachment": "detach",
        "Tranche Upfront Bid": "upfront_bid",
        "Tranche Upfront Mid": "upfront_mid",
        "Tranche Upfront Ask": "upfront_ask",
        "Index Price Mid": "index_price",
        "Tranche Spread Mid": "tranche_spread",
        "Red Code": "redindexcode",
    }
    kept_columns = [
        "basketid",
        "quotedate",
        "tenor",
        "attach",
        "detach",
        "upfront_bid",
        "upfront_ask",
        "upfront_mid",
        "tranche_spread",
        "index_price",
    ]
    index_version = pd.read_sql_table("index_version", engine, index_col="redindexcode")

    for path in paths:
        if workdate is not None:
            # Files are matched on their modification date, which has to be
            # the business day after the requested workdate.
            modified_on = datetime.datetime.fromtimestamp(
                os.path.getmtime(path)
            ).date()
            if modified_on != (workdate + BDay(1)).date():
                continue

        quotes = pd.read_csv(path, skiprows=2, parse_dates=["Date"])
        quotes = quotes.rename(columns=renames)
        quotes["attach"] = quotes["attach"] * 100
        quotes["detach"] = quotes["detach"] * 100
        quotes["tranche_spread"] = quotes["tranche_spread"] * 10000
        quotes["tenor"] = quotes["tenor"].str.lower() + "r"
        quotes = quotes.set_index("redindexcode").join(index_version)
        quotes = quotes.filter(kept_columns)
        quotes.to_sql(
            "markit_tranche_quotes", engine, if_exists="append", index=False
        )