1
0
mirror of https://github.com/microsoft/qlib.git synced 2026-07-04 19:41:00 +08:00

init commit

This commit is contained in:
Young
2020-09-22 01:43:21 +00:00
parent aa51e5aad3
commit 99ebd87cba
131 changed files with 20218 additions and 0 deletions

View File

@@ -0,0 +1,2 @@
# Copyright (c) Microsoft Corporation.
# Licensed under the MIT License.

View File

@@ -0,0 +1,152 @@
# cython: profile=False
# cython: boundscheck=False, wraparound=False, cdivision=True
cimport cython
cimport numpy as np
import numpy as np
from libc.math cimport sqrt, isnan, NAN
from libcpp.vector cimport vector
cdef class Expanding(object):
"""1-D array expanding"""
cdef vector[double] barv
cdef int na_count
def __init__(self):
self.na_count = 0
cdef double update(self, double val):
pass
cdef class Mean(Expanding):
"""1-D array expanding mean"""
cdef double vsum
def __init__(self):
super(Mean, self).__init__()
self.vsum = 0
cdef double update(self, double val):
self.barv.push_back(val)
if isnan(val):
self.na_count += 1
else:
self.vsum += val
return self.vsum / (self.barv.size() - self.na_count)
cdef class Slope(Expanding):
"""1-D array expanding slope"""
cdef double x_sum
cdef double x2_sum
cdef double y_sum
cdef double xy_sum
def __init__(self):
super(Slope, self).__init__()
self.x_sum = 0
self.x2_sum = 0
self.y_sum = 0
self.xy_sum = 0
cdef double update(self, double val):
self.barv.push_back(val)
cdef size_t size = self.barv.size()
if isnan(val):
self.na_count += 1
else:
self.x_sum += size
self.x2_sum += size * size
self.y_sum += val
self.xy_sum += size * val
cdef int N = size - self.na_count
return (N*self.xy_sum - self.x_sum*self.y_sum) / \
(N*self.x2_sum - self.x_sum*self.x_sum)
cdef class Resi(Expanding):
"""1-D array expanding residuals"""
cdef double x_sum
cdef double x2_sum
cdef double y_sum
cdef double xy_sum
def __init__(self):
super(Resi, self).__init__()
self.x_sum = 0
self.x2_sum = 0
self.y_sum = 0
self.xy_sum = 0
cdef double update(self, double val):
self.barv.push_back(val)
cdef size_t size = self.barv.size()
if isnan(val):
self.na_count += 1
else:
self.x_sum += size
self.x2_sum += size * size
self.y_sum += val
self.xy_sum += size * val
cdef int N = size - self.na_count
slope = (N*self.xy_sum - self.x_sum*self.y_sum) / \
(N*self.x2_sum - self.x_sum*self.x_sum)
x_mean = self.x_sum / N
y_mean = self.y_sum / N
interp = y_mean - slope*x_mean
return val - (slope*size + interp)
cdef class Rsquare(Expanding):
"""1-D array expanding rsquare"""
cdef double x_sum
cdef double x2_sum
cdef double y_sum
cdef double y2_sum
cdef double xy_sum
def __init__(self):
super(Rsquare, self).__init__()
self.x_sum = 0
self.x2_sum = 0
self.y_sum = 0
self.y2_sum = 0
self.xy_sum = 0
cdef double update(self, double val):
self.barv.push_back(val)
cdef size_t size = self.barv.size()
if isnan(val):
self.na_count += 1
else:
self.x_sum += size
self.x2_sum += size
self.y_sum += val
self.y2_sum += val * val
self.xy_sum += size * val
cdef int N = size - self.na_count
cdef double rvalue = (N*self.xy_sum - self.x_sum*self.y_sum) / \
sqrt((N*self.x2_sum - self.x_sum*self.x_sum) * (N*self.y2_sum - self.y_sum*self.y_sum))
return rvalue * rvalue
cdef np.ndarray[double, ndim=1] expanding(Expanding r, np.ndarray a):
cdef int i
cdef int N = len(a)
cdef np.ndarray[double, ndim=1] ret = np.empty(N)
for i in range(N):
ret[i] = r.update(a[i])
return ret
def expanding_mean(np.ndarray a):
cdef Mean r = Mean()
return expanding(r, a)
def expanding_slope(np.ndarray a):
cdef Slope r = Slope()
return expanding(r, a)
def expanding_rsquare(np.ndarray a):
cdef Rsquare r = Rsquare()
return expanding(r, a)
def expanding_resi(np.ndarray a):
cdef Resi r = Resi()
return expanding(r, a)

207
qlib/data/_libs/rolling.pyx Normal file
View File

@@ -0,0 +1,207 @@
# cython: profile=False
# cython: boundscheck=False, wraparound=False, cdivision=True
cimport cython
cimport numpy as np
import numpy as np
from libc.math cimport sqrt, isnan, NAN
from libcpp.deque cimport deque
cdef class Rolling(object):
"""1-D array rolling"""
cdef int window
cdef deque[double] barv
cdef int na_count
def __init__(self, int window):
self.window = window
self.na_count = window
cdef int i
for i in range(window):
self.barv.push_back(NAN)
cdef double update(self, double val):
pass
cdef class Mean(Rolling):
"""1-D array rolling mean"""
cdef double vsum
def __init__(self, int window):
super(Mean, self).__init__(window)
self.vsum = 0
cdef double update(self, double val):
self.barv.push_back(val)
if not isnan(self.barv.front()):
self.vsum -= self.barv.front()
else:
self.na_count -= 1
self.barv.pop_front()
if isnan(val):
self.na_count += 1
# return NAN
else:
self.vsum += val
return self.vsum / (self.window - self.na_count)
cdef class Slope(Rolling):
"""1-D array rolling slope"""
cdef double i_sum # can be used as i2_sum
cdef double x_sum
cdef double x2_sum
cdef double y_sum
cdef double xy_sum
def __init__(self, int window):
super(Slope, self).__init__(window)
self.i_sum = 0
self.x_sum = 0
self.x2_sum = 0
self.y_sum = 0
self.xy_sum = 0
cdef double update(self, double val):
self.barv.push_back(val)
self.xy_sum = self.xy_sum - self.y_sum
self.x2_sum = self.x2_sum + self.i_sum - 2*self.x_sum
self.x_sum = self.x_sum - self.i_sum
cdef double _val
_val = self.barv.front()
if not isnan(_val):
self.i_sum -= 1
self.y_sum -= _val
else:
self.na_count -= 1
self.barv.pop_front()
if isnan(val):
self.na_count += 1
# return NAN
else:
self.i_sum += 1
self.x_sum += self.window
self.x2_sum += self.window * self.window
self.y_sum += val
self.xy_sum += self.window * val
cdef int N = self.window - self.na_count
return (N*self.xy_sum - self.x_sum*self.y_sum) / \
(N*self.x2_sum - self.x_sum*self.x_sum)
cdef class Resi(Rolling):
"""1-D array rolling residuals"""
cdef double i_sum # can be used as i2_sum
cdef double x_sum
cdef double x2_sum
cdef double y_sum
cdef double xy_sum
def __init__(self, int window):
super(Resi, self).__init__(window)
self.i_sum = 0
self.x_sum = 0
self.x2_sum = 0
self.y_sum = 0
self.xy_sum = 0
cdef double update(self, double val):
self.barv.push_back(val)
self.xy_sum = self.xy_sum - self.y_sum
self.x2_sum = self.x2_sum + self.i_sum - 2*self.x_sum
self.x_sum = self.x_sum - self.i_sum
cdef double _val
_val = self.barv.front()
if not isnan(_val):
self.i_sum -= 1
self.y_sum -= _val
else:
self.na_count -= 1
self.barv.pop_front()
if isnan(val):
self.na_count += 1
# return NAN
else:
self.i_sum += 1
self.x_sum += self.window
self.x2_sum += self.window * self.window
self.y_sum += val
self.xy_sum += self.window * val
cdef int N = self.window - self.na_count
slope = (N*self.xy_sum - self.x_sum*self.y_sum) / \
(N*self.x2_sum - self.x_sum*self.x_sum)
x_mean = self.x_sum / N
y_mean = self.y_sum / N
interp = y_mean - slope*x_mean
return val - (slope*self.window + interp)
cdef class Rsquare(Rolling):
"""1-D array rolling rsquare"""
cdef double i_sum
cdef double x_sum
cdef double x2_sum
cdef double y_sum
cdef double y2_sum
cdef double xy_sum
def __init__(self, int window):
super(Rsquare, self).__init__(window)
self.i_sum = 0
self.x_sum = 0
self.x2_sum = 0
self.y_sum = 0
self.y2_sum = 0
self.xy_sum = 0
cdef double update(self, double val):
self.barv.push_back(val)
self.xy_sum = self.xy_sum - self.y_sum
self.x2_sum = self.x2_sum + self.i_sum - 2*self.x_sum
self.x_sum = self.x_sum - self.i_sum
cdef double _val
_val = self.barv.front()
if not isnan(_val):
self.i_sum -= 1
self.y_sum -= _val
self.y2_sum -= _val * _val
else:
self.na_count -= 1
self.barv.pop_front()
if isnan(val):
self.na_count += 1
# return NAN
else:
self.i_sum += 1
self.x_sum += self.window
self.x2_sum += self.window * self.window
self.y_sum += val
self.y2_sum += val * val
self.xy_sum += self.window * val
cdef int N = self.window - self.na_count
cdef double rvalue
rvalue = (N*self.xy_sum - self.x_sum*self.y_sum) / \
sqrt((N*self.x2_sum - self.x_sum*self.x_sum) * (N*self.y2_sum - self.y_sum*self.y_sum))
return rvalue * rvalue
cdef np.ndarray[double, ndim=1] rolling(Rolling r, np.ndarray a):
cdef int i
cdef int N = len(a)
cdef np.ndarray[double, ndim=1] ret = np.empty(N)
for i in range(N):
ret[i] = r.update(a[i])
return ret
def rolling_mean(np.ndarray a, int window):
cdef Mean r = Mean(window)
return rolling(r, a)
def rolling_slope(np.ndarray a, int window):
cdef Slope r = Slope(window)
return rolling(r, a)
def rolling_rsquare(np.ndarray a, int window):
cdef Rsquare r = Rsquare(window)
return rolling(r, a)
def rolling_resi(np.ndarray a, int window):
cdef Resi r = Resi(window)
return rolling(r, a)