src/history_visualizer.py from siruku6/fx_alarm_py

src/history_visualizer.py
Summary

Maintainability

5 hrs
Test Coverage

59%
Issues
Coverage
import datetime
from datetime import timedelta
from typing import List, Optional, Tuple, TypedDict

from oanda_accessor_pyv20 import OandaInterface
import oanda_accessor_pyv20.preprocessor as prepro
import pandas as pd

from src.analyzer import Analyzer
from src.candle_loader import CandleLoader
from src.candle_storage import FXBase
from src.drawer import FigureDrawer
import src.lib.format_converter as converter
from src.lib.interface import select_instrument
from src.trader_config import TraderConfig


class DstSwitch(TypedDict):
    """One point at which the candle series flips between summer-time and winter-time hours."""

    # Candle timestamp string at which the new regime starts
    time: str
    # True when the regime starting at `time` is summer time (Daylight Saving Time)
    summer_time: bool


class Visualizer:
    DRAWABLE_ROWS = 200

    def __init__(
        self,
        from_iso: str,
        to_iso: str,
        instrument: str = None,
        indicator_names: Optional[Tuple[str, ...]] = None,
    ):
        """
        Set up the API client, candle loader and analyzer for one instrument

        Parameters
        ----------
        from_iso : string
            start of the period to load
        to_iso : string
            end of the period to load
        instrument : string, optional
            when it is falsy, the name returned by select_instrument() is used instead
        indicator_names : tuple of string, optional
            handed to Analyzer as it is
        """
        if instrument:
            chosen_instrument: str = instrument
        else:
            chosen_instrument = select_instrument()["name"]

        self.__instrument: str = chosen_instrument
        self.__from_iso: str = from_iso
        self.__to_iso: str = to_iso
        self.__client: OandaInterface = OandaInterface(instrument=chosen_instrument)

        # TODO: remove TraderConfig from this line
        # NOTE(review): TraderConfig receives the raw `instrument` argument (possibly None),
        #   not the resolved name - confirm that this is intended
        loader_config = TraderConfig("unittest", instrument)
        self.__candle_loader: "CandleLoader" = CandleLoader(loader_config, self.__client, 0)

        self.__ana: Analyzer = Analyzer(indicator_names)
        # INFO: stays None until __collect_full_dataframe stores the calculated indicators
        self._indicators: pd.DataFrame = None

    @property
    def indicators(self) -> pd.DataFrame:
        """Indicator DataFrame held by this instance (None until one has been stored)"""
        return self._indicators

    @indicators.setter
    def indicators(self, indicators: pd.DataFrame) -> None:
        """Replace the indicator DataFrame held by this instance"""
        self._indicators = indicators

    def run(self) -> pd.DataFrame:
        """
        Request the transactions between from_iso and to_iso,
        then return them merged with H1 candles and indicators

        Returns
        -------
        pd.DataFrame
        """
        return self.__collect_full_dataframe(
            self.__client.request_massive_transactions(self.__from_iso, self.__to_iso),
            granularity="H1",
        )

    # NOTE: This is not used on AWS Lambda
    def visualize_latest_hist(self, granularity: str) -> None:
        """
        Merge one page of transactions with candles, dump the result as CSV and draw it

        Parameters
        ----------
        granularity : string
            M1, M5, M10, H1, or D and so on ...
        """
        latest_transactions: pd.DataFrame = self.__client.prepare_one_page_transactions()
        merged: pd.DataFrame = self.__collect_full_dataframe(
            latest_transactions, granularity=granularity
        )

        # INFO: export first, then render the chart
        merged.to_csv("./tmp/csvs/oanda_trade_hist.csv", index=False)
        self.__draw_history()

    #
    # Private
    #
    def __collect_full_dataframe(
        self, history_df: pd.DataFrame, granularity: str = "M10"
    ) -> pd.DataFrame:
        """
        Build one dataframe holding candles, trade-history and indicators

        The merged candles are also stored through FXBase.set_candles,
        and the calculated indicators are stored on self.indicators.

        Parameters
        ----------
        history_df : pd.DataFrame
            trade-history; when it has no rows, only candles are used
        granularity : string
            M1, M5, M10, H1, or D and so on ...

        Returns
        -------
        pd.DataFrame
        """
        loaded_candles: pd.DataFrame = self.__prepare_candles(granularity=granularity)
        print("[Libra] candles and trade-logs are loaded")

        has_history: bool = len(history_df) != 0
        merged: pd.DataFrame = (
            self.__merge_candles_and_hist(loaded_candles, history_df, granularity)
            if has_history
            else loaded_candles
        )

        FXBase.set_candles(merged)
        print("[Libra] candles and trade-history are merged")

        # INFO: indicators are calculated from the merged candles
        self.__ana.calc_indicators(candles=merged)
        self.indicators = self.__ana.get_indicators()
        print("[Libra] and indicators are merged")

        return merged.merge(self.indicators, on="time", how="left")

    def __merge_candles_and_hist(
        self, candles: pd.DataFrame, history_df: pd.DataFrame, granularity: str
    ) -> pd.DataFrame:
        """
        Join trade-history rows onto candles and add pl / gross / stoploss columns

        Parameters
        ----------
        candles : pd.DataFrame
        history_df : pd.DataFrame
            trade-history; it is modified by this method
            (price is cast, and 'pl' is dropped in place)
        granularity : string

        Returns
        -------
        pd.DataFrame
            candles left-merged with positions and pl, plus 'gross' (cumulative pl) and 'stoploss'
        """
        # NOTE(review): on pandas >= 2.0, `.loc[:, col] = values` writes in place, so an
        #   object-dtype price column presumably keeps its dtype - confirm the cast takes effect
        history_df.loc[:, "price"] = history_df.price.astype("float32")
        # INFO: align history timestamps with candle timestamps (this also adds a 'dst' column)
        history_df = self.__adjust_time_for_merging(candles, history_df, granularity)

        # prepare pl_and_gross
        # INFO: pl has to be extracted before the 'pl' column is dropped on the next line
        hist_pl_df = self.__extract_pl(granularity, history_df[["time", "pl", "dst"]])
        history_df.drop("pl", axis=1, inplace=True)  # a single pl column is enough

        tmp_positions_df = self.__extract_positions_df_from(history_df)
        result = self.__merge_hist_dfs(candles, tmp_positions_df, hist_pl_df)
        result.loc[:, "gross"] = result["pl"].cumsum()
        # INFO: a copy is passed, so the helper works on its own frame
        result["stoploss"] = self.__fill_stoploss(result.copy())
        return result

    def __prepare_candles(self, granularity: str) -> pd.DataFrame:
        """
        Load candles for the configured period

        The start is 20 candle-widths before from_iso,
        but never earlier than 400 candle-widths before to_iso.

        Parameters
        ----------
        granularity : string

        Returns
        -------
        pd.DataFrame
        """
        candle_span: timedelta = prepro.granularity_to_timedelta(granularity)
        requested_start: pd.Timestamp = converter.to_timestamp(self.__from_iso) - candle_span * 20

        # TODO: whether 400 is appropriate needs careful consideration.
        #   400 candle-widths are requested but only about 220 candles come back
        #   (perhaps because there are no candles on holidays)
        end_dt: pd.Timestamp = converter.to_timestamp(self.__to_iso)
        earliest_allowed: pd.Timestamp = end_dt - candle_span * 400

        return self.__candle_loader.load_candles_by_duration_for_hist(
            instrument=self.__instrument,
            start=max(requested_start, earliest_allowed),
            end=end_dt,
            granularity=granularity,
        )

    def __adjust_time_for_merging(
        self, candles: pd.DataFrame, history_df: pd.DataFrame, granularity: str
    ) -> pd.DataFrame:
        dict_dst_switches: List[DstSwitch] = None
        if granularity in ("H4",) and len(history_df) > 0:
            # TODO: dict_dst_switches は H4 candles でのみしか使えない形になっている
            dict_dst_switches = self.__detect_dst_switches(candles)
            history_df = self.__append_dst_column(history_df, dst_switches=dict_dst_switches)
        else:
            history_df.loc[:, "dst"] = None

        # make time smooth, adaptively to Daylight Saving Time
        if granularity == "M10":  # TODO: M15, 30 も対応できるようにする
            history_df["time"] = [converter.convert_to_m10(time) for time in history_df.time]
        elif granularity in ("H1", "H4"):
            history_df["time"] = [
                self.__convert_time_str_to(granularity, time, dict_dst_switches)
                for time in history_df.time
            ]
        return history_df

    def __detect_dst_switches(self, candles: pd.DataFrame) -> List[DstSwitch]:
        """
        daylight saving time の切り替わりタイミングを見つける
        """
        candles["summer_time"] = pd.to_numeric(candles.time.str[12], downcast="signed") % 2 == 1
        switch_points = candles[candles.summer_time != candles.summer_time.shift(1)][
            ["time", "summer_time"]
        ]
        return switch_points.to_dict("records")  # type: ignore

    def __append_dst_column(
        self, original_df: pd.DataFrame, dst_switches: List[DstSwitch]
    ) -> pd.DataFrame:
        """
        dst is Daylight Saving Time

        Parameters
        ----------
        dst_switches : array of dict
            sample: [
                {'time': '2020-02-17 06:00:00', 'summer_time': False},
                {'time': '2020-03-12 17:00:00', 'summer_time': True},
                ...
            ]
        """
        hist_df = original_df.copy()
        switch_count = len(dst_switches)

        for i, dst_switching_point in enumerate(dst_switches):
            is_dst = dst_switching_point["summer_time"]
            if i == (switch_count - 1):
                target_row_index = dst_switching_point["time"] <= hist_df["time"]
            else:
                target_row_index = (dst_switching_point["time"] <= hist_df["time"]) & (
                    hist_df["time"] < dst_switches[i + 1]["time"]
                )
            hist_df.loc[target_row_index, "dst"] = is_dst

        hist_df["dst"] = hist_df["dst"].astype(bool)
        return hist_df

    def __convert_time_str_to(
        self,
        granularity: str,
        oanda_time: str,
        dict_dst_switches: Optional[List[DstSwitch]],
    ) -> str:
        time_str: str = oanda_time.replace("T", " ")
        # INFO: 12文字目までで hour まで取得できる
        time: datetime.datetime = datetime.datetime.strptime(time_str[:13], "%Y-%m-%d %H")

        # INFO: adjust according to day light saving time
        if granularity in ("H4",):
            if self.__is_summer_time(time_str, dict_dst_switches):
                # INFO: OandaのH4は [1,5,9,13,17,21] を取り得るので、それをはみ出した時間を切り捨て
                minus = (time.hour + 3) % 4
            else:
                minus = time.hour % 4
            time -= datetime.timedelta(hours=minus)

        hour_str: str = time.strftime("%Y-%m-%d %H:%M:%S")
        return hour_str

    def __is_summer_time(self, time_str: str, dict_dst_switches: List[DstSwitch]) -> bool:
        for i, switch_dict in enumerate(dict_dst_switches):
            if dict_dst_switches[-1]["time"] < time_str:
                return dict_dst_switches[-1]["summer_time"]
            elif switch_dict["time"] < time_str and time_str < dict_dst_switches[i + 1]["time"]:
                return switch_dict["summer_time"]

    def __extract_pl(self, granularity: str, original_df: pd.DataFrame) -> pd.DataFrame:
        """
        Parameters
        ----------
        granularity : string
        original_df : dataframe
            .index -> name: time, type: datetime
            .columns -> [
                'pl', # integer
                'dst' # boolean
            ]

        Returns
        ----------
        pl_hist : dataframe
        """
        if granularity in ("H4",):
            pl_hist = self.__downsample_pl_df(pl_df=original_df)
        elif granularity in ("H1",):
            pl_hist = self.__resample_by("1H", original_df.copy())
        else:
            pl_hist = original_df.copy()
        pl_hist.reset_index(inplace=True)
        pl_hist.loc[:, "time"] = pl_hist["time"].astype({"time": str})
        return pl_hist

    def __downsample_pl_df(self, pl_df: pd.DataFrame) -> pd.DataFrame:
        # time 列の調節と resampling
        hist_dst_on = self.__resample_by("4H", pl_df[pl_df["dst"]].copy(), offset="1h")
        hist_dst_off = self.__resample_by("4H", pl_df[~pl_df["dst"]].copy(), offset="0h")
        return hist_dst_on.append(hist_dst_off).sort_index()

    def __resample_by(
        self,
        rule: str,
        target_df: pd.DataFrame,
        offset: str = "0h",
    ) -> pd.DataFrame:
        target_df.loc[:, "time"] = pd.to_datetime(target_df["time"])
        if target_df.empty:
            return target_df[[]]

        return target_df.resample(rule, on="time", offset=offset).sum()

    def __merge_hist_dfs(
        self, candles: pd.DataFrame, tmp_positions_df: pd.DataFrame, hist_pl_df: pd.DataFrame
    ) -> pd.DataFrame:
        result: pd.DataFrame = pd.merge(candles, tmp_positions_df, on="time", how="left")
        result = pd.merge(result, hist_pl_df, on="time", how="left").drop_duplicates(["time"])
        result["pl"].fillna(0, inplace=True)
        return result

    def __extract_positions_df_from(self, d_frame: pd.DataFrame) -> pd.DataFrame:
        tmp_positions_df = (
            d_frame.dropna(subset=["tradeOpened"])[["price", "time", "units"]]
            .copy()
            .rename(columns={"price": "long"})
        )
        tmp_positions_df["short"] = tmp_positions_df["long"].copy()
        exits = (
            d_frame.dropna(subset=["tradesClosed"])[["price", "time"]]
            .copy()
            .rename(columns={"price": "exit"})
        )
        stoplosses = (
            d_frame[d_frame.type == "STOP_LOSS_ORDER"][["price", "time"]]
            .copy()
            .rename(columns={"price": "stoploss"})
        )
        tmp_positions_df = pd.merge(tmp_positions_df, exits, on="time", how="outer")
        tmp_positions_df = pd.merge(tmp_positions_df, stoplosses, on="time", how="outer")
        tmp_positions_df["units"] = tmp_positions_df["units"].fillna("0").astype(int)

        # INFO: remove unused records & values
        tmp_positions_df = tmp_positions_df.sort_values("time").drop_duplicates("time")
        # INFO: Nan は描画されないが None も描画されない
        tmp_positions_df.loc[tmp_positions_df.units <= 0, "long"] = None
        tmp_positions_df.loc[tmp_positions_df.units >= 0, "short"] = None

        return tmp_positions_df  # , exit_df, trail_df

    def __fill_stoploss(self, hist_df: pd.DataFrame) -> pd.DataFrame:
        """entry ~ exit の間の stoploss を補完"""
        hist_df.loc[pd.notna(hist_df["exit"].shift(1)), "entried"] = False
        is_long_or_short = hist_df[["long", "short"]].any(axis=1)
        hist_df.loc[is_long_or_short, "entried"] = True
        hist_df["entried"] = hist_df["entried"].fillna(method="ffill").fillna(False)
        hist_df["stoploss"] = hist_df.loc[hist_df["entried"], "stoploss"].fillna(method="ffill")
        return hist_df.loc[:, "stoploss"]

    def __draw_history(self) -> None:
        """
        Draw the latest DRAWABLE_ROWS candles with indicators and trade-history, and save a png

        Candles are read through FXBase.get_candles; indicators come from self.indicators.
        """
        row_limit: int = Visualizer.DRAWABLE_ROWS

        # INFO: prepare data
        candles_and_hist = (
            FXBase.get_candles(start=-row_limit, end=None).copy().reset_index(drop=True)
        )
        # TODO: candles_and_hist also contains the whole indicators data,
        #   so the next line had better be revised
        drawn_indicators = self.indicators[-row_limit:]

        # - - - - - - - - - - - - - - - - - - - -
        #                 Drawing
        # - - - - - - - - - - - - - - - - - - - -
        drawer = FigureDrawer(rows_num=3, instrument=self.__instrument)
        drawer.draw_indicators(d_frame=drawn_indicators.reset_index(drop=True))

        # INFO: draw trade-history and positions (only when history was merged)
        if "long" in candles_and_hist.columns:
            self.__draw_hists(drawer, drawn_indicators, candles_and_hist)

        # INFO: candles older than the latest DRAWABLE_ROWS rows are cut off
        drawer.draw_candles(candles_and_hist.iloc[-row_limit:, :])
        png_result = drawer.create_png(
            granularity="real-trade", sr_time=candles_and_hist.time, num=0, filename="hist"
        )
        drawer.close_all()
        print(png_result["success"])

    def __draw_hists(
        self, drawer: FigureDrawer, drawn_indicators: pd.DataFrame, candles_and_hist: pd.DataFrame
    ) -> None:
        """
        Draw entries, exits, stoploss, gross and pl on the given drawer

        Parameters
        ----------
        drawer : FigureDrawer
        drawn_indicators : pd.DataFrame
            needs 'sigma*-2_band' and 'sigma*2_band'; they bound the vertical entry lines
        candles_and_hist : pd.DataFrame
            needs 'long', 'short', 'exit', 'stoploss', 'gross' and 'pl' columns;
            its 'gross' column is forward-filled in place
        """
        # INFO: vertical lines on every row which has an entry (long or short)
        drawer.draw_vertical_lines(
            indexes=candles_and_hist[["long", "short"]].dropna(how="all").index,
            vmin=drawn_indicators["sigma*-2_band"].min(skipna=True),
            vmax=drawn_indicators["sigma*2_band"].max(skipna=True),
        )

        for column_name in ("long", "short", "exit"):
            drawer.draw_positions_df(
                positions_df=candles_and_hist[[column_name]].rename(columns={column_name: "price"}),
                plot_type=drawer.PLOT_TYPE[column_name],
            )
        drawer.draw_positions_df(
            positions_df=candles_and_hist[["stoploss"]].rename(columns={"stoploss": "price"}),
            plot_type=drawer.PLOT_TYPE["trail"],
        )

        # axis3
        # INFO: the column is reassigned with ffill(). `fillna(method="ffill", inplace=True)` on a
        #   selected column is deprecated, and does not update the frame under Copy-on-Write
        candles_and_hist["gross"] = candles_and_hist["gross"].ffill()
        drawer.draw_df(candles_and_hist[["gross"]], names=["gross"])
        drawer.draw_df(candles_and_hist[["pl"]], names=["profit"])