mirror of
https://github.com/microsoft/qlib.git
synced 2026-07-03 11:00:57 +08:00
139 lines
4.9 KiB
Python
139 lines
4.9 KiB
Python
import pandas as pd
|
|
import numpy as np
|
|
from gym.spaces import Discrete, Box, Tuple, MultiDiscrete
|
|
import math
|
|
import json
|
|
|
|
|
|
class BaseObs(object):
|
|
""" """
|
|
|
|
def __init__(self, config):
|
|
self._observation_space = None
|
|
|
|
def get_space(self):
|
|
""" """
|
|
return self._observation_space
|
|
|
|
def get_obs(self, t):
|
|
pass
|
|
|
|
|
|
class RuleObs(BaseObs):
|
|
"""The observation for minute-level rule-based agents, which consists of prediction, private state and direction information."""
|
|
|
|
def __init__(self, config):
|
|
feature_size = 0
|
|
self.features = config["features"]
|
|
self.time_interval = config["time_interval"]
|
|
self.max_step_num = config["max_step_num"]
|
|
for feature in self.features:
|
|
feature_size += feature["size"]
|
|
|
|
self._observation_space = Tuple(
|
|
(
|
|
Box(-np.inf, np.inf, shape=(feature_size,), dtype=np.float32),
|
|
Box(-np.inf, np.inf, shape=(4,), dtype=np.float32),
|
|
Discrete(2),
|
|
)
|
|
)
|
|
|
|
def __call__(self, *args, **kargs):
|
|
return self.get_obs(*args, **kargs)
|
|
|
|
def get_feature_res(self, df_list, time, interval, whole_day=False, interval_num=8):
|
|
"""
|
|
This method would extract the needed feature from the feature dataframe based on the feature name
|
|
and the description in feature config.
|
|
|
|
:param df_list: The dataframes of features, the order is consistent with the feature list.
|
|
:param time: The index of current minute of the day (starting from -1).
|
|
:param interval: The index of interval or decition making.
|
|
:param whole_day: if True, this method would return the concatenate of all dataframe.(Default value = False)
|
|
|
|
"""
|
|
predictions = []
|
|
if whole_day:
|
|
try:
|
|
prediction = [df_list[i].reshape(-1) for i in range(len(df_list))]
|
|
except:
|
|
prediction = [df_list[i].reshape(-1) for i in range(len(df_list))]
|
|
for i, p in enumerate(prediction):
|
|
if len(p) < interval_num:
|
|
prediction[i] = np.concatenate((p, np.zeros(interval_num - len(p))), axis=-1)
|
|
# res = np.stack(prediction).transpose().reshape(-1)
|
|
return np.concatenate(prediction)
|
|
for i in range(len(self.features)):
|
|
feature = self.features[i]
|
|
df = df_list[i]
|
|
size = feature["size"]
|
|
if feature["type"] == "inday":
|
|
if time == -1:
|
|
predictions += [0.0] * size
|
|
else:
|
|
predictions += df.iloc[size * time : size * (time + 1)].reshape(-1).tolist()
|
|
elif feature["type"] == "daily":
|
|
predictions += df.reshape(-1)[:size].tolist()
|
|
elif feature["type"] == "range":
|
|
# if feature.startswith('oracle'):
|
|
# predictions += df.iloc[:, (time + 1) : size + (time + 1)].reshape(-1).tolist()
|
|
if time == -1:
|
|
predictions += [0.0] * size
|
|
else:
|
|
predictions += df.iloc[time : size + time].reshape(-1).tolist()
|
|
elif feature["type"] == "interval":
|
|
if len(df.iloc[interval * size : (interval + 1) * size].reshape(-1)) == size:
|
|
predictions += df.iloc[interval * size : (interval + 1) * size].reshape(-1).tolist()
|
|
else:
|
|
predictions += [0.0] * size
|
|
elif feature["type"] == "step":
|
|
if len(df.iloc[size * (time + 1) : size * (time + 2)].reshape(-1)) == size:
|
|
predictions += df.iloc[size * (time + 1) : size * (time + 2)].reshape(-1).tolist()
|
|
else:
|
|
predictions += [0.0] * size
|
|
|
|
return np.array(predictions)
|
|
|
|
def get_obs(self, raw_df, feature_dfs, t, interval, position, target, is_buy, *args, **kargs):
|
|
private_state = np.array([position, target, t, self.max_step_num])
|
|
prediction_state = self.get_feature_res(feature_dfs, t, interval)
|
|
return {
|
|
"prediction": prediction_state,
|
|
"private": private_state,
|
|
"is_buy": int(is_buy),
|
|
}
|
|
|
|
|
|
class RuleInterval(RuleObs):
|
|
"""
|
|
The observation for interval_level rule based strategy.
|
|
|
|
Consist of interval prediction, private state, direction
|
|
|
|
|
|
"""
|
|
|
|
def get_obs(
|
|
self,
|
|
raw_df,
|
|
feature_dfs,
|
|
t,
|
|
interval,
|
|
position,
|
|
target,
|
|
is_buy,
|
|
max_step_num,
|
|
interval_num,
|
|
action=1.0,
|
|
*args,
|
|
**kargs
|
|
):
|
|
private_state = np.array([position, target, interval - 1, interval_num])
|
|
prediction_state = self.get_feature_res(feature_dfs, t, interval)
|
|
return {
|
|
"prediction": prediction_state,
|
|
"private": private_state,
|
|
"is_buy": int(is_buy),
|
|
"action": action,
|
|
}
|