unstable commit to allow sync with qexec master to move db code

2026-06-30 09:02:58 +08:00 · 2012-02-26 20:28:08 -05:00
parent f29c83e941
commit e94c8cf717
4 changed files with 282 additions and 114 deletions
@@ -0,0 +1,272 @@
+import datetime
+import quantoenv
+import math
+import pytz
+import numpy as np
+import numpy.linalg as la
+from pymongo import ASCENDING, DESCENDING
+
+class daily_return():
+    
+    def __init__(self, date, returns):
+        self.date = date
+        self.returns = returns
+        
+class periodmetrics():
+    def __init__(self, start_date, end_date, returns, benchmark_returns):
+        self.start_date = start_date
+        self.end_date = end_date
+        self.trading_calendar = trading_calendar
+        self.algorithm_period_returns, self.algorithm_returns = self.calculate_period_returns(returns)
+        self.benchmark_period_returns, self.benchmark_returns = self.calculate_period_returns(benchmark_returns)
+        if(len(self.benchmark_returns) != len(self.algorithm_returns)):
+            raise Exception("Mismatch between benchmark_returns ({bm_count}) and algorithm_returns ({algo_count}) in range {start} : {end}".format(
+                                                                                                                     bm_count=len(self.benchmark_returns),
+                                                                                                                     algo_count=len(self.algorithm_returns),
+                                                                                                                     start=start_date, 
+                                                                                                                     end=end_date))
+        self.trading_days = len(self.benchmark_returns)
+        self.benchmark_volatility = self.calculate_volatility(self.benchmark_returns)
+        self.algorithm_volatility = self.calculate_volatility(self.algorithm_returns)
+        self.treasury_period_return = self.choose_treasury()
+        self.sharpe = self.calculate_sharpe()
+        self.beta, self.algorithm_covariance, self.benchmark_variance, self.condition_number, self.eigen_values = self.calculate_beta()
+        self.alpha = self.calculate_alpha()
+        self.excess_return = self.algorithm_period_returns - self.treasury_period_return
+        self.max_drawdown = self.calculate_max_drawdown()
+        
+    def __repr__(self):
+        statements = []
+        for metric in ["algorithm_period_returns", "benchmark_period_returns", "excess_return", "trading_days", "benchmark_volatility", "algorithm_volatility", "sharpe", "algorithm_covariance", "benchmark_variance", "beta", "alpha", "max_drawdown", "algorithm_returns", "benchmark_returns", "condition_number", "eigen_values"]:
+            value = getattr(self, metric)
+            statements.append("{metric}:{value}".format(metric=metric, value=value))
+        
+        return '\n'.join(statements)
+        
+    def calculate_period_returns(self, daily_returns):
+        returns = [x.returns for x in daily_returns if x.date >= self.start_date and x.date <= self.end_date and self.trading_calendar.is_trading_day(x.date)]
+        #quantoenv.qlogger.debug("using {count} daily returns out of {total}".format(count=len(returns),total=len(daily_returns)))
+        period_returns = 1.0
+        for r in returns:
+            period_returns = period_returns * (1.0 + r)
+        period_returns = period_returns - 1.0
+        return period_returns, returns
+        
+    def calculate_volatility(self, daily_returns):
+        #quantoenv.qlogger.debug("trading days {td}".format(td=self.trading_days))
+        return np.std(daily_returns, ddof=1) * math.sqrt(self.trading_days)
+        
+    def calculate_sharpe(self):
+        return (self.algorithm_period_returns - self.treasury_period_return) / self.algorithm_volatility
+        
+    def calculate_beta(self):
+        #quantoenv.qlogger.debug("algorithm has {acount} days, benchmark has {bmcount} days".format(acount=len(self.algorithm_returns), bmcount=len(self.benchmark_returns)))
+        #it doesn't make much sense to calculate beta for less than two days, so return none.
+        if len(self.algorithm_returns) < 2:
+            return 0.0, 0.0, 0.0, 0.0, []
+        returns_matrix = np.vstack([self.algorithm_returns, self.benchmark_returns])
+        C = np.cov(returns_matrix)
+        eigen_values = la.eigvals(C)
+        condition_number = max(eigen_values) / min(eigen_values)
+        algorithm_covariance = C[0][1]
+        benchmark_variance = C[1][1]
+        beta = C[0][1] / C[1][1]
+        #quantoenv.qlogger.debug("bm variance is {bmv}, returns matrix is {rm}, covariance is {c}, beta is {beta}".format(rm=returns_matrix, bmv=C[1][1], c=C, beta=beta))
+        
+        return beta, algorithm_covariance, benchmark_variance, condition_number, eigen_values
+        
+    def calculate_alpha(self):
+        return self.algorithm_period_returns - (self.treasury_period_return + self.beta * (self.benchmark_period_returns - self.treasury_period_return))
+        
+    def calculate_max_drawdown(self):
+        compounded_returns = []
+        cur_return = 0.0
+        for r in self.algorithm_returns:
+            if(r != -1.0):
+                cur_return = math.log(1.0 + r) + cur_return
+            #this is a guard for a single day returning -100%
+            else:
+                quantoenv.qlogger.warn("negative 100 percent return, zeroing the returns")
+                cur_return = 0.0
+            compounded_returns.append(cur_return)
+            
+        #quantoenv.qlogger.debug("compounded returns are {cr}".format(cr=compounded_returns))
+        cur_max = None
+        max_drawdown = None
+        for cur in compounded_returns:
+            if cur_max == None or cur > cur_max:
+                cur_max = cur
+            
+            drawdown = (cur - cur_max)
+            if max_drawdown == None or drawdown < max_drawdown:
+                max_drawdown = drawdown
+        
+        #quantoenv.qlogger.debug("max drawdown is: {dd}".format(dd=max_drawdown))
+        if max_drawdown == None:
+            return 0.0
+            
+        return 1.0 - math.exp(max_drawdown)
+        
+    
+    def choose_treasury(self):
+        td = self.end_date - self.start_date
+        if td.days <= 31:
+            self.treasury_duration = '1month'
+        elif td.days <= 93:
+            self.treasury_duration = '3month'
+        elif td.days <= 186:
+            self.treasury_duration = '6month'
+        elif td.days <= 366:
+            self.treasury_duration = '1year'
+        elif td.days <= 365 * 2 + 1:
+            self.treasury_duration = '2year'
+        elif td.days <= 365 * 3 + 1:
+            self.treasury_duration = '3year'
+        elif td.days <= 365 * 5 + 2:
+            self.treasury_duration = '5year'
+        elif td.days <= 365 * 7 + 2:
+            self.treasury_duration = '7year'
+        elif td.days <= 365 * 10 + 2:
+            self.treasury_duration = '10year'
+        else:
+            self.treasury_duration = '30year'
+        
+        treasuryQS = quantoenv.getTickDB().treasury_curves.find(
+                                                            spec={"date" : {"$lte" : self.end_date}},
+                                                            sort=[("date",DESCENDING)],
+                                                            limit=3,
+                                                            slave_ok=True)
+    
+        for curve in treasuryQS:
+            self.treasury_curve = curve
+            rate = self.treasury_curve[self.treasury_duration]
+            #1month note data begins in 8/2001, so we can use 3month instead.
+            if rate == None and self.treasury_duration == '1month':
+                rate = self.treasury_curve['3month']
+            if rate != None:
+                return rate * (td.days + 1) / 365
+
+        raise Exception("no rate for end date = {dt} and term = {term}, from {curve}. Using zero.".format(dt=self.end_date, 
+                                                                                                          term=self.treasury_duration, 
+                                                                                                          curve=self.treasury_curve['date']))
+        
+class riskmetrics():
+    
+    def __init__(self, algorithm_returns):
+        """algorithm_returns needs to be a list of daily_return objects sorted in date ascending order"""
+        self.db = quantoenv.getTickDB()
+        self.algorithm_returns = algorithm_returns
+        self.bm_returns = [x for x in benchmark_returns if x.date >= self.algorithm_returns[0].date and x.date <= self.algorithm_returns[-1].date]
+        
+        quantoenv.qlogger.debug("#### {start} thru {end} with {count} trading_days of {total} possible".format(start=self.algorithm_returns[0].date, 
+                                                                                           end=self.algorithm_returns[-1].date,
+                                                                                           count=len(self.bm_returns),
+                                                                                           total=len(benchmark_returns)))
+        
+        #calculate month ends
+        self.month_periods          = self.periodsInRange(1, self.algorithm_returns[0].date, self.algorithm_returns[-1].date)
+        #calculate 3 month ends
+        self.three_month_periods    = self.periodsInRange(3, self.algorithm_returns[0].date, self.algorithm_returns[-1].date)
+        #calculate 6 month ends
+        self.six_month_periods      = self.periodsInRange(6, self.algorithm_returns[0].date, self.algorithm_returns[-1].date)
+        #calculate 1 year ends
+        self.year_periods           = self.periodsInRange(12, self.algorithm_returns[0].date, self.algorithm_returns[-1].date)
+        #calculate 3 year ends
+        self.three_year_periods     = self.periodsInRange(36, self.algorithm_returns[0].date, self.algorithm_returns[-1].date)
+        #calculate 5 year ends
+        self.five_year_periods      = self.periodsInRange(60, self.algorithm_returns[0].date, self.algorithm_returns[-1].date)
+        
+        
+    def periodsInRange(self, months_per, start, end):
+        one_day = datetime.timedelta(days = 1)
+        ends = []
+        cur_start = start.replace(day=1)
+        #ensure that we have an end at the end of a calendar month, in case the return series ends mid-month...
+        the_end = advance_by_months(end.replace(day=1),1) - one_day
+        while True:
+            cur_end = advance_by_months(cur_start, months_per) - one_day
+            if(cur_end > the_end):
+                break
+            #quantoenv.qlogger.debug("start: {start}, end: {end}".format(start=cur_start, end=cur_end))
+            cur_period_metrics = periodmetrics(start_date=cur_start, end_date=cur_end, returns=self.algorithm_returns, benchmark_returns=self.bm_returns)
+            ends.append(cur_period_metrics)
+            cur_start = advance_by_months(cur_start, 1)
+            
+        return ends
+        
+    def store_to_db(self, back_test_run_id):
+        col = quantoenv.getTickDB().risk_metrics
+        for period in self.month_periods:
+            for metric in ["algorithm_period_returns", "benchmark_period_returns", "excess_return", "trading_days", "benchmark_volatility", "algorithm_volatility", "sharpe", "beta", "alpha", "max_drawdown"]:
+                record = {'back_test_run_id':back_test_run_id}
+                record['ending_on']     = period.end_date
+                record['metric_name']   = metric
+                for dur in ["month", "three_month", "six_month", "year", "three_year", "five_year"]:
+                    record[dur] = self.find_metric_by_end(period.end_date, dur, metric)
+                    #quantoenv.qlogger.debug("storing {val} for {metric} and {dur}".format(val=record[dur], metric=metric, dur=dur))
+                col.insert(record, safe=True)
+    
+    def find_metric_by_end(self, end_date, duration, metric):
+        col = getattr(self, duration + "_periods")
+        col = [getattr(x, metric) for x in col if x.end_date == end_date]
+        if len(col) == 1:
+            return col[0]
+        return None
+        
+def advance_by_months(dt, jump_in_months):
+    month = dt.month + jump_in_months
+    years = month / 12
+    month = month % 12 
+
+    #no remainder means that we are landing in december.
+    #modulo is, in a way, a zero indexed circular array. 
+    #this is a way of converting to 1 indexed months. (in our modulo index, december is zeroth)
+    if(month == 0):
+        month = 12
+        years = years - 1
+    
+    r = dt.replace(year = dt.year + years, month = month)
+    return r
+
+class TradingCalendar(object):
+
+    def __init__(self, benchmark_returns):
+        self.trading_days = []
+        self.trading_day_map = {}
+        for bm in benchmark_returns:
+            self.trading_days.append(bm.date)
+            self.trading_day_map[bm.date] = bm
+    
+    def normalize_date(self, test_date):
+        return datetime.datetime(year=test_date.year, month=test_date.month, day=test_date.day, tzinfo=pytz.utc)
+     
+    def is_trading_day(self, test_date):
+        dt = self.normalize_date(test_date)
+        return self.trading_day_map.has_key(dt)
+    
+    def get_benchmark_daily_return(self, test_date):
+        date = self.normalize_date(test_date)
+        if self.trading_day_map.has_key(date):
+            return self.trading_day_map[date].returns
+        else:
+            return 0.0
+
+       
+def get_benchmark_data():
+    bmQS = quantoenv.getTickDB().bench_marks.find(
+                                 spec={"symbol" : "GSPC", 
+                                        "date":{"$gte": quantoenv.getUTCFromExchangeTime(datetime.datetime.strptime('01/01/1990','%m/%d/%Y')), 
+                                                "$lte": quantoenv.getUTCFromExchangeTime(datetime.datetime.strptime('12/31/2010','%m/%d/%Y'))}},
+                                 sort=[("date",ASCENDING)],
+                                 slave_ok=True,
+                                 as_class=quantoenv.DocWrap)
+    bm_returns = []
+    for bm in bmQS:
+        bm_r = daily_return(date=bm.date.replace(tzinfo=pytz.utc), returns=bm.returns)
+        bm_returns.append(bm_r)    
+
+    cal = TradingCalendar(bm_returns)
+    return bm_returns, cal
+
+benchmark_returns, trading_calendar = get_benchmark_data() 
+    
@@ -1,107 +0,0 @@
-import datetime
-import pytz
-from algorithm.quantoenv import *
-from algorithm.quantomodels import *
-from algorithm.hostedalgorithm import *
-from algorithm.risk import *
-
-def createReturns(daycount, start):
-    i = 0
-    test_range = []
-    current = start.replace(tzinfo=pytz.utc)
-    one_day = datetime.timedelta(days = 1)
-    while i < daycount: 
-        i += 1
-        r = daily_return(current, random.random())
-        test_range.append(r)
-        current = current + one_day
-    return [ x for x in test_range if(trading_calendar.is_trading_day(x.date)) ]
-
-def createReturnsFromRange(start, end):
-    current = start.replace(tzinfo=pytz.utc)
-    end = end.replace(tzinfo=pytz.utc)
-    one_day = datetime.timedelta(days = 1)
-    test_range = []
-    i = 0
-    while current <= end: 
-        current = current + one_day
-        if(not trading_calendar.is_trading_day(current)):
-            continue
-        r = daily_return(current, random.random())
-        i += 1
-        test_range.append(r)
-        
-    return test_range
-def createReturnsFromList(returns, start):
-    current = start.replace(tzinfo=pytz.utc)
-    one_day = datetime.timedelta(days = 1)
-    test_range = []
-    i = 0
-    while len(test_range) < len(returns): 
-        if(trading_calendar.is_trading_day(current)):
-            r = daily_return(current, returns[i])
-            i += 1
-            test_range.append(r)
-        current = current + one_day
-    return test_range
-    
-
-def createAlgo(filename):
-    algo = Algorithm()
-    algo.code = getCodeFromFile(filename)
-    algo.title = filename
-    algo._id = pymongo.objectid.ObjectId()
-    hostedAlgo = HostedAlgorithm(algo)
-    return hostedAlgo       
-    
-def getCodeFromFile(filename):
-    rVal = None
-    with open('./test/algo_samples/' + filename, 'r') as f:
-        rVal = f.read()
-    return rVal
-    
-                          
-def createTrade(sid, price, amount, datetime):
-    row = {}
-    row['sid'] = sid
-    row['dt'] = datetime
-    row['price'] = price
-    row['volume'] = amount
-    row['exchange_code'] = "fake exchange"
-    db = getTickDB()
-    db.equity.trades.minute.insert(row,safe=True)
-    dw = DocWrap()
-    dw.store = row
-    return dw
- 
-def createTradeHistory(sid, priceList, amtList, startTime, interval):
-    i = 0
-    trades = []
-    current = startTime
-    while i < len(priceList):
-        if(trading_calendar.is_trading_day(current)):  
-            trades.append(createTrade(sid, priceList[i], amtList[i], current))
-            current = current + interval
-            i += 1
-        else:
-            current = current + datetime.timedelta(days=1)
-        
-    return trades 
-    
-def createTxn(sid, price, amount, datetime, btrid=None):
-    txn = Transaction(sid=sid, amount=amount, dt = datetime, 
-                      price=price, transaction_cost=-1*price*amount)
-    return txn
-    
-def createTxnHistory(sid, priceList, amtList, startTime, interval):
-    i = 0
-    txns = []
-    current = startTime
-    while i < len(priceList):
-        if(trading_calendar.is_trading_day(current)): 
-            txns.append(createTxn(sid,priceList[i],amtList[i], current))
-            current = current + interval
-            i += 1
-        else:
-            current = current + datetime.timedelta(days=1) 
-    return txns
@@ -74,11 +74,11 @@ def createTrade(sid, price, amount, datetime):
    dw.store = row
    return dw
 
-def createTradeHistory(sid, priceList, amtList, startTime, interval):
+def create_trade_history(sid, prices, amounts, start_time, interval):
    i = 0
    trades = []
-    current = startTime
-    while i < len(priceList):
+    current = start_time
+    while i < len(prices):
        if(trading_calendar.is_trading_day(current)):  
            trades.append(createTrade(sid, priceList[i], amtList[i], current))
            current = current + interval
@@ -2,6 +2,7 @@
 from unittest2 import TestCase

 from zipline.test.test_messaging import SimulatorTestCase
+import zipline.test.factory as factory
 from zipline.monitor import Controller
 from zipline.messaging import DataSource
 import zipline.util as qutil
@@ -56,7 +57,11 @@ class ThreadPoolExecutor(SimulatorTestCase, TestCase):
        # Simulation Components
        # ---------------------

-        ret1 = RandomEquityTrades(133, "ret1", 5000)
+        ret1 = SpecificEquityTrades("flat-133",factory.create_trade_history(133,    
+                                                                            [10.0,11.0,10.0,10.0], 
+                                                                            [100,100,100,100], 
+                                                                            datetime.datetime.utcnow(), 
+                                                                            datetime.timedelta(days=1)))
        ret2 = RandomEquityTrades(134, "ret2", 5000)
        mavg1 = MovingAverage("mavg1", 30)
        mavg2 = MovingAverage("mavg2", 60)
@@ -80,6 +85,4 @@ class ThreadPoolExecutor(SimulatorTestCase, TestCase):
            "The feed should be drained of all messages, found {n} remaining."
            .format(n=sim.feed.pending_messages())
        )
-        
-
-class PredefinedDataSource()
+