import os
import sys
import time
import datetime
import struct
import calendar
from dateutil.parser import parse

import numpy as np
import pandas as pd
from pandas import DataFrame, Series
import matplotlib.pyplot as plt
import seaborn as sns

%matplotlib inline

MT4のヒストリフォルダを指定します¶

通常ヒストリのフォルダはroamingフォルダの中だったと思いますが僕は /portable をつけて起動しているのでroamingじゃないとこにヒストリフォルダがあるのでこんな感じのパスになってます

HST_DIR = r'D:\MT4\FXCM MetaTrader 4\history\FXCM-JPYDemo01'

hstファイルを読み込むクラス¶

__init__()にヒストリファイルのパスを渡して読み込む感じで使うようにしました

class MT4hstReader(object):
    """mt4 hst reader
    arg: hst file path
    """
    def __init__(self, path=None):
        self.HEADER_SIZE = 148
        self.BAR_BYTE = 60
        self.headerdict_keys = [
            'var', 'copyright', 'symbol',
            'period', 'digits', 'timesign',
            'last_sync', 'unsused'
        ]
        self.filepath = path
        if self.filepath: self._init()
    
    def set_path(self, path):
        """set file path & read info"""
        self.filepath = path
        self._init()
    
    def print_fileinfo(self):
        """print header info"""
        print '\n'.join(['{}: {}'.format(k, self.header_dict[k])
                         for k in self.headerdict_keys])
        print (
            'filesize: {}byte\nbars: {}\n'
            'firstbartime: {} [{}]\nlastbartime: {} [{}]'
        ).format(
            self.filesize, self.bars,
            self.firstbartime,
            datetime.datetime.utcfromtimestamp(self.firstbartime),
            self.lastbartime,
            datetime.datetime.utcfromtimestamp(self.lastbartime)
        )
    
    def hst_symbol(self):
        """str hst symbol"""
        return self.header_dict['symbol']
    
    def hst_period(self):
        """int hst period"""
        return int(self.header_dict['period'])
    
    def hst_digits(self):
        """int hst digits"""
        return int(self.header_dict['digits'])
    
    def get_data(self, n=0, idx=0, mt4index=False, method='py'):
        """get hst data
        arg:
            n: read bars
            idx: readidx mt4timeseries index
            mt4index: ret index type, True=mt4timeseries
            method: 'py':pure python  'np':numpy  'df':pd.DataFrame
        ret:
            MqlRates[idx+n-1] ~ MqlRates[idx]
            py: [(int, float, float, float, float, int)]
            np: [('t', '<i8'), ('o', '<f8'), ('h', '<f8'),
                 ('l', '<f8'), ('c', '<f8'), ('v', '<i8')]
            df: float64
        """
        if idx>self.bars-1 or idx<0:
            print 'idx out of range'
            return None
        if n==0 or n>self.bars-idx:
            n = self.bars-idx
        readstart_pos = self.HEADER_SIZE + (self.bars-n-idx)*self.BAR_BYTE
        rates = None
        with open(self.filepath, 'rb') as f:
            if method!='py':
                # np or df
                dtype = np.dtype([('t','i8'), ('o','f8'), ('h','f8'), ('l','f8'),
                                  ('c','f8'), ('v','i8'), ('s','i4'), ('r','i8')])
                dtype_tohlcv = np.dtype([('t','i8'), ('o','f8'), ('h','f8'),
                                         ('l','f8'), ('c','f8'), ('v','i8')])
                rates = np.frombuffer(f.read(), dtype=dtype, count=n,
                                      offset=readstart_pos).astype(dtype_tohlcv)
                if mt4index: rates=rates[::-1]
                if method=='df': rates=DataFrame(rates)
            else:
                # pure python
                f.seek(readstart_pos, os.SEEK_SET)
                
                # rates = [self._unpack_bar_data(f.read(self.BAR_BYTE))
                #          for _ in xrange(n)]
        
                # 一旦変数に入れてmapで処理(上のより少し速いけど余分にメモリを食う?)
                data = f.read(self.BAR_BYTE*n)
                rates = map(self._unpack_bar_data, [data[i:i+self.BAR_BYTE]
                            for i in xrange(0, len(data), self.BAR_BYTE)])
                if mt4index: rates.reverse()
        return rates
    
    def get_data_dt(self, startdate=None, enddate=None, mt4index=False, method='py'):
        """get hst data
        arg: startdate, enddate: str or datetime.datetime or unixepoch
        """
        st, ed = self._get_idx_tuple(startdate, enddate)
        return self.get_data(st-ed+1, ed, mt4index, method)
    
    def _get_idx_tuple(self, startdate=None, enddate=None):
        """
        指定された期間のインデックスのタプルを返す
        はじめにおおよその位置にシークしてそこからwhileで探す
        argtypes:
            str or datetime.datetime or unixepoch
        ret: (startdate_idx, enddate_idx)
        example:
            call: ('2015-01-01', 2015-12-31)
            ret: (350, 100)
        memo:
            MT4の時系列配列のインデックスに見立てて計算している
        """
        def to_epoch(date):
            if isinstance(date, str):
                return calendar.timegm(parse(date).timetuple())
            elif isinstance(date, datetime.datetime):
                return calendar.timegm(date.timetuple())
            elif isinstance(date, int):
                return date
        st_epoch = self.firstbartime if startdate is None else to_epoch(startdate)
        ed_epoch = self.lastbartime if enddate is None else to_epoch(enddate)
        if st_epoch is None or ed_epoch is None:
            if not st_epoch: print '_get_idx_tuple() arg err!!! check startdate'
            if not ed_epoch: print '_get_idx_tuple() arg err!!! check enddate'
            return None
        if st_epoch>ed_epoch:
            st_epoch, ed_epoch = ed_epoch, st_epoch
        st_epoch = max(self.firstbartime, min(self.lastbartime, st_epoch))
        ed_epoch = max(self.firstbartime, min(self.lastbartime, ed_epoch))
        min_idx = 0
        max_idx = self.bars-1
        timerange = float(self.lastbartime-self.firstbartime)
        st_abaut_idx = int((self.lastbartime-st_epoch)/timerange*(max_idx))
        ed_abaut_idx = int((self.lastbartime-ed_epoch)/timerange*(max_idx))
        
        def read_datetime(f):
            # mt4のdatetime8byteを読んでseek位置を戻す
            t = struct.unpack('Q', f.read(8))[0]
            f.seek(-8, os.SEEK_CUR)
            return t
        def index_seek(f, i):
            # MT4時系列配列のindexの値でseekする
            i = max(min_idx, min(max_idx, i))
            f.seek(-self.BAR_BYTE-(i*self.BAR_BYTE), os.SEEK_END)
        def pos_to_index(f):
            # 現在の位置をmt4の時系列配列のindexに変換
            return (self.filesize-f.tell())/self.BAR_BYTE-1
        def search(f, search_t, method='l'):
            # methodはちょうどの時刻がないとき左右どっちの足のindexを返すか('l' or 'r')
            idx = pos_to_index(f)
            t = read_datetime(f)
            timer = time.clock()
            # ストレージの種類によりけりだと思うけど異様に遅かったら中止
            # プログラムのミスのせいも考えられる
            limit_sec = 10
            while 1:
                if t==search_t: return idx
                idx += 1 if t>search_t else -1
                if idx<=min_idx: return min_idx
                if idx>=max_idx: return max_idx
                pre_t = t
                index_seek(f, idx)
                t = read_datetime(f)
                if min(t, pre_t) < search_t < max(t, pre_t):
                    if t>pre_t: return idx+1 if method=='l' else idx
                    if t<pre_t: return idx if method=='l' else idx-1
                if time.clock()>timer+limit_sec:
                    print 'time over!!! search() bug???'
                    return None
        
        with open(self.filepath, 'rb') as f:
            index_seek(f, st_abaut_idx)
            st_idx = search(f, st_epoch, 'r')
            index_seek(f, ed_abaut_idx)
            ed_idx = search(f, ed_epoch, 'l')
            return st_idx, ed_idx
        return None
    
    def _unpack_bar_data(self, data):
        """ret: tuple(datetime, o, h, l, c, v)"""
        return struct.unpack('QddddQQL', data)[:-2]
    
    def _unpack_header_data(self, data):
        """set headerinfo dict"""
        readsize = [4, 64, 12, 4, 4, 4, 4, 52]
        unpackcmd = ['L', '64s', '12s', 'L', 'L', 'L', 'L', '13L']
        dic = {}
        read = 0
        for k,rs,c in zip(self.headerdict_keys, readsize, unpackcmd):
            dic[k] = struct.unpack(c, data[read:read+rs])[0]
            read += rs
        return dic
    
    def _init(self):
        """read hstfile info
        set: filesize, header, firstbartime, lastbartime, bars
        """
        if not os.path.exists(self.filepath):
            print 'file not found'
            return None
        self.filesize = os.path.getsize(self.filepath)
        self.bars = (self.filesize-self.HEADER_SIZE)/self.BAR_BYTE
        with open(self.filepath, 'rb') as f:
            self.header_dict = self._unpack_header_data(f.read(self.HEADER_SIZE))
            self.firstbartime = self._unpack_bar_data(f.read(self.BAR_BYTE))[0]
            f.seek(-self.BAR_BYTE, os.SEEK_END)
            self.lastbartime = self._unpack_bar_data(f.read(self.BAR_BYTE))[0]

試しに使ってみます¶

filename = os.path.join(HST_DIR, 'USDJPY60.hst')
hstreader = MT4hstReader(filename)

# hstのヘッダ情報を見てみる
hstreader.print_fileinfo()

var: 401
copyright: (C)opyright 2003, MetaQuotes Software Corp.
symbol: USDJPY
period: 60
digits: 3
timesign: 1326176242
last_sync: 0
unsused: 0
filesize: 6099388byte
bars: 101654
firstbartime: 946857600 [2000-01-03 00:00:00]
lastbartime: 1463785200 [2016-05-20 23:00:00]

get_data()でデータを読み込む¶

type_pylist = hstreader.get_data(n=10)
print type(type_pylist)
for i in type_pylist:
    print i

<type 'list'>
(1463752800, 110.343, 110.439, 110.327, 110.335, 3587)
(1463756400, 110.335, 110.402, 110.266, 110.331, 5100)
(1463760000, 110.332, 110.483, 110.278, 110.474, 7081)
(1463763600, 110.47, 110.578, 110.414, 110.454, 6775)
(1463767200, 110.449, 110.555, 110.446, 110.524, 4732)
(1463770800, 110.525, 110.531, 110.426, 110.481, 3324)
(1463774400, 110.481, 110.49, 110.124, 110.177, 4943)
(1463778000, 110.178, 110.241, 110.071, 110.228, 3519)
(1463781600, 110.227, 110.227, 110.098, 110.156, 2782)
(1463785200, 110.155, 110.205, 110.068, 110.097, 1160)

# method='np'で読み込んでみる　本数が多いとこっちが速いぽい
type_np = hstreader.get_data(n=10, method='np')
print type(type_np)
for i in type_np:
    print i

<type 'numpy.ndarray'>
(1463752800L, 110.343, 110.439, 110.327, 110.335, 3587L)
(1463756400L, 110.335, 110.402, 110.266, 110.331, 5100L)
(1463760000L, 110.332, 110.483, 110.278, 110.474, 7081L)
(1463763600L, 110.47, 110.578, 110.414, 110.454, 6775L)
(1463767200L, 110.449, 110.555, 110.446, 110.524, 4732L)
(1463770800L, 110.525, 110.531, 110.426, 110.481, 3324L)
(1463774400L, 110.481, 110.49, 110.124, 110.177, 4943L)
(1463778000L, 110.178, 110.241, 110.071, 110.228, 3519L)
(1463781600L, 110.227, 110.227, 110.098, 110.156, 2782L)
(1463785200L, 110.155, 110.205, 110.068, 110.097, 1160L)

# method='df'で読み込んでみる
type_df = hstreader.get_data(n=10, method='df')
type_df

get_data_dt()で読み込む¶

文字列を渡せば日付文字列としてパースして処理する
dateutil.parserでパースできる文字列ならOKになってるはず
datetime.datetimeオブジェクトを渡してもいい
整数が渡されたらMT4のdatetimeと同様に扱う

# 日付文字列で読み込む
for i in hstreader.get_data_dt(startdate='2016-01-01')[:5]:
    print i
print '-'*60

# datetime.datetimeで読み込む
for i in hstreader.get_data_dt(datetime.datetime(2016, 1, 1))[:5]:
    print i
print '-'*60

# epoch秒で読み込む
t = calendar.timegm(datetime.datetime(2016, 1, 1).timetuple())
print 't={}'.format(t)
for i in hstreader.get_data_dt(t)[:5]:
    print i
# 1/1を指定してるけどその日はデータがないので先頭は2日かなんかのデータになってると思います

(1451865600, 120.2, 120.299, 120.184, 120.27, 1709)
(1451869200, 120.274, 120.372, 120.22, 120.304, 5003)
(1451872800, 120.304, 120.379, 120.255, 120.359, 8089)
(1451876400, 120.359, 120.453, 119.996, 120.017, 11509)
(1451880000, 120.016, 120.032, 119.633, 119.806, 18887)
------------------------------------------------------------
(1451865600, 120.2, 120.299, 120.184, 120.27, 1709)
(1451869200, 120.274, 120.372, 120.22, 120.304, 5003)
(1451872800, 120.304, 120.379, 120.255, 120.359, 8089)
(1451876400, 120.359, 120.453, 119.996, 120.017, 11509)
(1451880000, 120.016, 120.032, 119.633, 119.806, 18887)
------------------------------------------------------------
t=1451606400
(1451865600, 120.2, 120.299, 120.184, 120.27, 1709)
(1451869200, 120.274, 120.372, 120.22, 120.304, 5003)
(1451872800, 120.304, 120.379, 120.255, 120.359, 8089)
(1451876400, 120.359, 120.453, 119.996, 120.017, 11509)
(1451880000, 120.016, 120.032, 119.633, 119.806, 18887)

MultiColumnのDataFrameで読み込むやつも作りました¶

__init__()にヒストリフォルダのパスを渡すようにして使うようにしました
データの読み込み自体は上で定義したMT4hstReaderを使います

class MT4hstDF(object):
    """mt4 hst to pd.DataFrame"""
    
    def __init__(self, hstdirpath=None):
        self.hstdirpath = hstdirpath
        self.hstreader = MT4hstReader()
    
    def set_hstdir(self, path):
        """set hst dir path"""
        self.hstdirpath = path
    
    def get_df(self, symbollist, tf, offsethour=0,
               h1_to_d1=False, summertime=False, n=0, idx=0,
               startdate=None, enddate=None, collist=None):
        """
        get multicolumns dataframe
        args:
            symbollist: list
            tf: int
            offsethour: int
            h1_to_d1: bool
            summertime: bool
            n: int
            idx: int 
            startdate, enddate: datetime or str or int_unixepoch
        ret:
            pd.DataFrame
            index: pandas.tseries.index.DatetimeIndex
            collist: pandas.core.index.MultiIndex
            ret example:
                -----------------------------------------...
                |           |EURUSD             |GBPUSD  ...
                |----------------------------------------...
                |           |o  |h  |l  |c  |v  |o  |h  |...
                |----------------------------------------...
                |t          |   |   |   |   |   |   |   |...
                |----------------------------------------...
                |2016-02-25 |val|val|val|val|val|val|val|....
                |----------------------------------------...
                |2016-02-26 |val|val|val|val|val|val|val|...
                |----------------------------------------...
                |2016-02-27 |val|val|val|val|val|val|val|...
                |----------------------------------------...
        example:
            MT4hstDF_object.get_df(
                    ['EURUSD', 'GBPUSD', 'USDJPY'], 60,
                    startdate='2015-01-01', enddate='2015-12-31')
        """
        if collist is None:
            collist = 'o h l c v'.split()
        h2d = False
        if tf==1440 and h1_to_d1:
            h2d = True
        datalist = []
        for symbol in symbollist:
            filepath = os.path.join(self.hstdirpath,
                                    symbol+str(60 if h2d else tf)+'.hst')
            if not os.path.exists(filepath):
                continue
            self.hstreader.set_path(filepath)
            if startdate is not None or enddate is not None:
                df = self.hstreader.get_data_dt(method='df',
                                                startdate=startdate,
                                                enddate=enddate)
            else:
                df = self.hstreader.get_data(method='df', n=n, idx=idx)
            df = df.set_index(pd.to_datetime(df['t'], unit='s')
                             ).drop('t', axis=1)[collist]
            if offsethour:
                df.index += pd.tseries.offsets.Hour(offsethour) # adj index
            if h2d:
                df=self.__h1df_to_d1(df, summertime, collist) # h1tod1
            df.columns = pd.MultiIndex.from_product([symbol, df.columns])
            datalist.append(df)
        return pd.concat(datalist, axis=1)
    
    def __h1df_to_d1(self, df, summertime, collist):
        """get_df sub routine"""
        w, s = 7, 7
        if summertime: s-=1
        df.index = self.__hour_shift(df.index, -w, -s)
        ohlc_dict = {'o':'first', 'h':'max', 'l':'min', 'c':'last', 'v':'sum'}
        ohlc_dict = {k:v for k,v in ohlc_dict.items() if k in collist}
        df = df.resample('D', how=ohlc_dict).dropna()[collist]
        df.index = self.__hour_shift(df.index, w, s)
        return df
    
    def __hour_shift(self, index, w, s):
        """get_df sub routine"""
        st_date_dic = {y:self.__get_summertime_tuple(y, index.tz)
                       for y in range(index[0].year, index[-1].year+1)}
        def f(date):
            st, ed = st_date_dic[date.year]
            return (date+datetime.timedelta(hours=s) if ed>=date>=st
                    else date+datetime.timedelta(hours=w))
        return map(f, index)
    
    def __get_summertime_tuple(self, y, tz):
        """get_df sub routine"""
        mn3  = pd.date_range('{}-03-01'.format(y),
                             '{}-04-01'.format(y), tz=tz)[:-1]
        mn11 = pd.date_range('{}-11-01'.format(y),
                             '{}-12-01'.format(y), tz=tz)[:-1]
        def f(mn):
            month = mn[0].month
            sdcnt = 0
            for d, wd in zip(mn, map(lambda x: x.weekday() ,mn)):
                if month==3:
                    if wd==6: sdcnt += 1
                    if sdcnt==2: return d # 3月第2日曜日
                else:
                    if wd==6: return d-datetime.timedelta(days=1) # 11月第1日曜日
        return f(mn3), f(mn11)

ヒストリフォルダのパスを渡します¶

dfreader = MT4hstDF(HST_DIR)

"""
def get_df(self, symbollist, tf, offsethour=0,
           h1_to_d1=False, summertime=False, n=0, idx=0,
           startdate=None, enddate=None, collist=None)

symbollisetは通貨ペア名のリスト
dfはタイムフレーム 1,5,15,30,60,240,1440 のような整数を渡します
offsethourはdatetime.indexの調整　何時間ずらすか入れる
h1_to_d1はTrueでH1のデータから日足データを作る
    日足が6本のとことかだと微妙なのでH1から日足を作るとき使う
summertimeは夏時間の部分をずらすときのために作ったような気がするがよく覚えてない(´・ω・｀)

n=0, idx=0, startdate=None, enddate=None
は本数で読み込むか、日付文字列やdatetime.datetimeで読み込むかの引数で好きなほうを使う
collistは読み込む列デフォルトは t o h l c v を読み込む
"""

symbols = ['EURUSD', 'GBPUSD', 'USDJPY',
           'EURJPY', 'GBPJPY', 'EURGBP',
           'AUDUSD', 'USDCHF', 'USDCAD']

df = dfreader.get_df(symbols, 60, startdate='2010-01-01')
print df.columns
print df.shape
df.tail()

MultiIndex(levels=[[u'AUDUSD', u'EURGBP', u'EURJPY', u'EURUSD', u'GBPJPY', u'GBPUSD', u'USDCAD', u'USDCHF', u'USDJPY'], [u'c', u'h', u'l', u'o', u'v']],
           labels=[[3, 3, 3, 3, 3, 5, 5, 5, 5, 5, 8, 8, 8, 8, 8, 2, 2, 2, 2, 2, 4, 4, 4, 4, 4, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 7, 7, 7, 7, 7, 6, 6, 6, 6, 6], [3, 1, 2, 0, 4, 3, 1, 2, 0, 4, 3, 1, 2, 0, 4, 3, 1, 2, 0, 4, 3, 1, 2, 0, 4, 3, 1, 2, 0, 4, 3, 1, 2, 0, 4, 3, 1, 2, 0, 4, 3, 1, 2, 0, 4]])
(39634, 45)

# 曜日別、時間別の値幅をプロットしてみる(´・ω・｀)
hl = DataFrame()
for symbol in df.columns.levels[0]:
    hl = pd.concat(
        [hl, DataFrame((df[symbol]['h']-df[symbol]['l'])/df[symbol]['o']*100, columns=[symbol])],
        axis=1
    )

wdays = np.array('mon tue wed thu fri sat sun'.split())
hl['hour'] = hl.index.hour
hl['weekday'] = wdays[hl.index.weekday]

gbw = hl.groupby('weekday')
gbh = hl.groupby('hour')
gbwm = gbw.mean().loc[wdays[:5]]
gbhm = gbh.mean()

gbwm[[i for i in gbwm.columns if i!='hour']].plot(figsize=(15,4), style='-o')
gbhm.plot(figsize=(15,4), style='-o')

<matplotlib.axes._subplots.AxesSubplot at 0xb245ef0>

日足の終値を読み込んでみます¶

d1 = dfreader.get_df(symbols, 1440, startdate='2013-01-01', collist=['c'])
d1.tail()

(1+d1.pct_change()).fillna(1).cumprod().plot(figsize=(15,5))

<matplotlib.axes._subplots.AxesSubplot at 0xb0720f0>

# ヒストリカルボラティリティ　1行でかけると気持ちいい(´・ω・｀)
if pd.__version__>='0.18.0':
    (np.log1p((d1.pct_change()).fillna(0)).rolling(20).std()*np.sqrt(250)).plot(figsize=(15,5))
else:
    (pd.rolling_std(np.log1p((d1.pct_change()).fillna(0)), 20)*np.sqrt(250)).plot(figsize=(15,5))

KuChartも作ってみる(´・ω・｀)¶

def get_straight(symbol, df):
    df_symbols = df.columns.levels[0]
    if symbol in df_symbols:
        return df[symbol]['c']
    cross_jpy = symbol.replace('USD', '')+'JPY'
    if cross_jpy in df_symbols:
        if symbol.index('USD')==3:
            return df[cross_jpy]['c'] / df['USDJPY']['c']
        if symbol.index('USD')==0:
            return df['USDJPY']['c'] / df[cross_jpy]['c']
    print 'err'

def get_cross(symbol, straight_dic):
    st_base = {k:v for k,v in straight_dic.items() if symbol[:3] in k}
    st_quote = {k:v for k,v in straight_dic.items() if symbol[3:] in k}
    b_usd_idx = st_base.keys()[0].index('USD')
    q_usd_idx = st_quote.keys()[0].index('USD')
    if b_usd_idx==3 and q_usd_idx==3:
        return st_base.values()[0] / st_quote.values()[0]
    elif b_usd_idx==3 and q_usd_idx==0:
        return st_base.values()[0] * st_quote.values()[0]
    elif b_usd_idx==0 and q_usd_idx==0:
        return st_quote.values()[0] / st_base.values()[0]
    print 'err'

def get_KuChart(df, currencys=None, multicols=False):
    default = 'EUR GBP AUD NZD USD CAD CHF JPY'.split()
    currencys = [c for c in default if c in currencys] if currencys else default
    usd_idx = currencys.index('USD')
    straight_symbols = [c+'USD' if currencys.index(c)<usd_idx else 'USD'+c
                        for c in currencys if c!='USD']
    cross_symbols = [currencys[i]+currencys[j]
                     for i in range(len(currencys))
                     for j in range(i+1, len(currencys))
                     if not 'USD' in currencys[i]+currencys[j]]
    straight_close_dic = {s:get_straight(s, df) for s in straight_symbols}
    cross_close_dic = {s:get_cross(s, straight_close_dic) for s in cross_symbols }
    price_dic = dict(straight_close_dic, **cross_close_dic)
    price_dic = dict([[k,np.log1p(v.pct_change().fillna(0))] for k,v in price_dic.items()])
    f = lambda keys,d,c:sum(d[k] if k.index(c)==0 else -d[k] for k in keys)/len(keys)
    ku = DataFrame({c: f([k for k in price_dic.keys() if c in k], price_dic, c)
                    for c in currencys})
    if multicols:
        ku.columns = pd.MultiIndex.from_product(['ku', ku.columns])
    return ku

ku = get_KuChart(d1, 'EUR GBP AUD USD CAD CHF JPY'.split())
ku.tail()

ku_clr_dic = {'EUR':'Red', 'GBP':'Lime', 'AUD':'RoyalBlue', 'NZD':'Violet',
              'USD':'Orange', 'CAD':'BlueViolet', 'CHF':'Gray', 'JPY':'Turquoise'}
params = {'figsize':(15,5), 'color':[ku_clr_dic[c] for c in ku.columns]}

ku.plot(**params)

<matplotlib.axes._subplots.AxesSubplot at 0xb8048d0>

ku.cumsum().plot(**params)

<matplotlib.axes._subplots.AxesSubplot at 0xb190cf8>

ku_y = pd.concat([ku[str(i)].cumsum() for i in sorted(list(set(ku.index.year)))])
ku_y.plot(lw=1, **params)

<matplotlib.axes._subplots.AxesSubplot at 0xbd54240>

p = max(ku.quantile(0.995).max(), -ku.quantile(0.05).min())
xlim = (-p, p)
ku.plot(kind='kde', lw=1, xlim=xlim, **params)

<matplotlib.axes._subplots.AxesSubplot at 0xc08c1d0>

p = ku.abs().quantile(0.99).max()
ku.abs().plot(kind='kde', lw=1, xlim=(0,p), **params)

<matplotlib.axes._subplots.AxesSubplot at 0xc068630>

sns.pairplot(ku)

<seaborn.axisgrid.PairGrid at 0xdafc198>

n = 30000
data = DataFrame(
    (np.random.randn(n)/1000).cumsum()+100,
    index=pd.date_range(end=datetime.datetime.now().date(),periods=n, freq='s')
)
data.plot(figsize=(15,5))

def candle(df, size=(15,5)):
    # ローソク足を表示する 重い
    from matplotlib.finance import candlestick_ohlc
    df = df.copy()
    plt.figure(figsize=size)
    df['idx'] = range(df.index.size)
    ax = plt.subplot()
    candlestick_ohlc(ax, df['idx o h l c'.split()].values, width=0.8, colorup='forestgreen', colordown='brown')
    labelstep = max([1, int(df.index.size/15)])
    ax.set_xticks(df['idx'][::labelstep])
    ax.set_xticklabels(map(lambda x: str(x)[:10], df.index[::labelstep]), rotation=45, fontsize=8)
    ax.set_xlim(left=0)
    df.drop('idx', axis=1, inplace=True)

ohlc_data = data.resample('5min').agg('ohlc')
ohlc_data.columns = 'o h l c'.split()
candle(ohlc_data)

	EURUSD					GBPUSD					...	USDCHF					USDCAD
	o	h	l	c	v	o	h	l	c	v	...	o	h	l	c	v	o	h	l	c	v
t
2016-05-20 19:00:00	1.12058	1.12140	1.12053	1.12119	3392.0	1.45101	1.45168	1.45037	1.45136	5025.0	...	0.99191	0.99202	0.99076	0.99122	960.0	1.31342	1.31349	1.31173	1.31272	2042.0
2016-05-20 20:00:00	1.12118	1.12250	1.12103	1.12208	3141.0	1.45137	1.45223	1.45107	1.45177	3632.0	...	0.99122	0.99131	0.98946	0.98969	973.0	1.31276	1.31320	1.31120	1.31193	1575.0
2016-05-20 21:00:00	1.12207	1.12273	1.12173	1.12183	2411.0	1.45175	1.45220	1.45027	1.45036	3074.0	...	0.98970	0.99071	0.98941	0.99060	871.0	1.31193	1.31336	1.31157	1.31327	1557.0
2016-05-20 22:00:00	1.12185	1.12209	1.12121	1.12157	2689.0	1.45036	1.45047	1.44847	1.44899	3619.0	...	0.99059	0.99117	0.99038	0.99076	509.0	1.31324	1.31347	1.31195	1.31195	1135.0
2016-05-20 23:00:00	1.12157	1.12205	1.12131	1.12141	816.0	1.44899	1.44989	1.44883	1.44958	966.0	...	0.99077	0.99087	0.99033	0.99051	324.0	1.31187	1.31210	1.31090	1.31146	419.0

	EURUSD	GBPUSD	USDJPY	EURJPY	GBPJPY	EURGBP	AUDUSD	USDCHF	USDCAD
	c	c	c	c	c	c	c	c	c
t
2016-05-16	1.13187	1.43970	109.005	123.392	156.950	0.78582	0.72869	0.97745	1.28918
2016-05-17	1.13099	1.44599	109.108	123.420	157.785	0.78192	0.73214	0.98063	1.29100
2016-05-18	1.12144	1.45956	110.185	123.576	160.837	0.76781	0.72268	0.98736	1.30265
2016-05-19	1.12016	1.46079	109.942	123.165	160.616	0.76576	0.72265	0.99028	1.30916
2016-05-20	1.12141	1.44958	110.097	123.502	159.659	0.77321	0.72137	0.99051	1.31146

	AUD	CAD	CHF	EUR	GBP	JPY	USD
t
2016-05-16	0.002484	0.003392	-0.003574	0.000793	0.002360	-0.004845	-0.000610
2016-05-17	0.005060	-0.002096	-0.004240	-0.001358	0.004636	-0.001552	-0.000450
2016-05-18	-0.008874	-0.004182	-0.001681	-0.003595	0.017196	-0.005161	0.006298
2016-05-19	0.000963	-0.004804	-0.002433	-0.000320	0.001995	0.003588	0.001012
2016-05-20	-0.000109	-0.000088	0.001689	0.003261	-0.007028	0.000316	0.001960

	t	o	h	l	c	v
0	1463752800	110.343	110.439	110.327	110.335	3587
1	1463756400	110.335	110.402	110.266	110.331	5100
2	1463760000	110.332	110.483	110.278	110.474	7081
3	1463763600	110.470	110.578	110.414	110.454	6775
4	1463767200	110.449	110.555	110.446	110.524	4732
5	1463770800	110.525	110.531	110.426	110.481	3324
6	1463774400	110.481	110.490	110.124	110.177	4943
7	1463778000	110.178	110.241	110.071	110.228	3519
8	1463781600	110.227	110.227	110.098	110.156	2782
9	1463785200	110.155	110.205	110.068	110.097	1160