mirror of
https://github.com/microsoft/qlib.git
synced 2026-06-06 05:51:17 +08:00
* MVP for Indian Stocks in qlib using yahooquery * cleaned with black * cleaned with black * add YahooNormalizeIN and YahooNormalizeIN1d * cleaned the code * added 1min for IN and also updated readme * update comments * fix comments * recorder support upload both raw file and directory * fix comments * Update README.md * Fix docs of QlibRecorder * sort index after loader (#538) make sure the fetch method is based on a index-sorted pd.DataFrame * refactor online serving rolling api * refactor TRA * format by black * fix horizon * fix TRA when use single head * clean up * improve pretrain * update README * fix tra when logdir is None * fix tra when logdir is None * Update strategy.py * Update README.md * Update README.md * Conda Suggestion * code standard docs * Update ensemble.py (#560) * Fix CI Bug (#575) Co-authored-by: yuxwang <anduinnn@foxmail.com> * Update gen.py (#576) * Fix multi-process loop calls (#574) * check lexsort in the 'lazy_sort_index' function (#566) * check lexsort * check lexsort * lexsort comment * lexsort comment * Delete .DS_Store * Update README.md * bug fix & use oracle transport pretrain * mend * Add `backend_freq_config` parameter, support multi-freq uri * Add sample_config to QlibDataLoader, support multi-freq * add multi-freq example * get_cls_kwargs renamed get_callable_kwargs * support multi-freq uri * Add inst_processors to D.features * Fix typo * Fix the index type of the multi-freq example * Fix duplicate mlflow directories in tests * Add DataPathManager to QlibConfig && modify inst_processors to supports list only * Modify the default value in the multi_freq example * Modify client-server mode and dataset-cache to disable inst_processor * Add wheel package to github CI * fix comment * Update FAQ.rst * Update README.md Fix wrong link * Update the docs of TaskManager (#586) * Update manage.py * update yaml * update run_all_model * Modify the Feature to be case sensitive (#589) * update README * remove verbose * fix spell bug * fix 
typos (#592) * Update Release Note * fix portfolio bug * Add calendar support for resample * add freq kwargs * test.yml: Remove redundant code (#595) * Supporting shared processor (#596) * Supporting shared processor * fix readonly reverse bug * remove pytests dependency * with fit bug * fix parameter error * fix comments * Fix undefined names in Python code (#599) * Update pytorch_tabnet.py $ `flake8 . --count --select=E9,F63,F7,F82 --show-source --statistics` ``` ./qlib/qlib/contrib/model/pytorch_tabnet.py:567:38: F821 undefined name 'inp' self.independ.append(GLU(inp, out_dim, vbs=vbs)) ^ ./qlib/examples/model_rolling/task_manager_rolling.py:75:18: F821 undefined name 'task_train' run_task(task_train, self.task_pool, experiment_name=self.experiment_name) ^ 2 F821 undefined name 'task_train' 2 ``` * Fix undefined names in Python code * from qlib.model.trainer import task_train * update seed * fix some docstring * add comments * Fix SimpleDatasetCache * Update setup.py updated classifiers * Update setup.py change to matplotlib==3.3 * Update python-publish.yml added python 3.9 * updategrade version number * Update model list * fix the type of filter_pipe * fix comment * fix record_temp * update cvxpy version * Update code_standard.rst (#587) * Update code_standard.rst * Update docs/developer/code_standard.rst Co-authored-by: you-n-g <you-n-g@users.noreply.github.com> Co-authored-by: you-n-g <you-n-g@users.noreply.github.com> * Add file lock for MLflowExpManager (#619) * fix torch version * Share version number (#620) * Update initialization.rst (#622) * Update initialization.rst * Update docs/start/initialization.rst Co-authored-by: you-n-g <you-n-g@users.noreply.github.com> * Update docs/start/initialization.rst Co-authored-by: you-n-g <you-n-g@users.noreply.github.com> Co-authored-by: you-n-g <you-n-g@users.noreply.github.com> * fix bugs for running previous exmaple * fix deal amount bug * update change doc (#623) * Add files via upload * Update README.md * 
Update README.md * Update README.md * Delete change doc.gif * Add files via upload * Update README.md * Delete change doc.gif * Add files via upload * Delete change doc.gif * Add files via upload * Update README.md Co-authored-by: you-n-g <you-n-g@users.noreply.github.com> Co-authored-by: you-n-g <you-n-g@users.noreply.github.com> * update doc * simplify run all model * fix run all model bug * Fix Models (#483) * fix gat dataset * fix tft model * Update tft.py * Fix tft.py Co-authored-by: Pengrong Zhu <zhu.pengrong@foxmail.com> * type and skip empty exp * fix model yaml config * fix tft import bug * skip empty result * fix model and yaml bug * fix wrong generate parameter * Modify multi-freq example (#626) * modify the example of multi-freq * add Copyright * add a comment to average_ops.py * modify the example of multi-freq * add comment to multi_freq_handler.py * add the Ref expression description to multi_freq_handler.py * add expression description to multi_freq_handler.py * update images * fix workflow and update framework Co-authored-by: Gaurav <2796gaurav@gmail.com> Co-authored-by: 2796gaurav <17353992+2796gaurav@users.noreply.github.com> Co-authored-by: bxdd <bxd98@126.com> Co-authored-by: Young <afe.young@gmail.com> Co-authored-by: you-n-g <you-n-g@users.noreply.github.com> Co-authored-by: Dong Zhou <Zhou.Dong@microsoft.com> Co-authored-by: ZhangTP1996 <ztp18@mails.tsinghua.edu.cn> Co-authored-by: demon143 <59681577+demon143@users.noreply.github.com> Co-authored-by: Wangwuyi123 <51237097+Wangwuyi123@users.noreply.github.com> Co-authored-by: yuxwang <anduinnn@foxmail.com> Co-authored-by: Pengrong Zhu <zhu.pengrong@foxmail.com> Co-authored-by: Mark Zhao <50850474+markzhao98@users.noreply.github.com> Co-authored-by: cslwqxx <cslwqxx@users.noreply.github.com> Co-authored-by: Dong Zhou <evanzd@users.noreply.github.com> Co-authored-by: SaintMalik <37118134+saintmalik@users.noreply.github.com> Co-authored-by: Christian Clauss <cclauss@me.com> Co-authored-by: 
Anurag Kumar <mailanu98@gmail.com> Co-authored-by: demon143 <785696300@qq.com>
112 lines
3.9 KiB
Python
112 lines
3.9 KiB
Python
# Copyright (c) Microsoft Corporation.
|
|
# Licensed under the MIT License.
|
|
|
|
"""
|
|
This example shows how a TrainerRM works based on TaskManager with rolling tasks.
|
|
After training, how to collect the rolling results will be shown in task_collecting.
|
|
Based on the ability of TaskManager, the `worker` method offers a simple way to do multiprocessing.
|
|
"""
|
|
|
|
from pprint import pprint
|
|
|
|
import fire
|
|
import qlib
|
|
from qlib.config import REG_CN
|
|
from qlib.workflow import R
|
|
from qlib.workflow.task.gen import RollingGen, task_generator
|
|
from qlib.workflow.task.manage import TaskManager, run_task
|
|
from qlib.workflow.task.collect import RecorderCollector
|
|
from qlib.model.ens.group import RollingGroup
|
|
from qlib.model.trainer import TrainerRM, task_train
|
|
from qlib.tests.config import CSI100_RECORD_LGB_TASK_CONFIG, CSI100_RECORD_XGBOOST_TASK_CONFIG
|
|
|
|
|
|
class RollingTaskExample:
    """Example of a rolling-task workflow: generate tasks, train them, collect the results.

    Each public method is one step of the workflow; ``main`` chains them together.
    """

    def __init__(
        self,
        provider_uri="~/.qlib/qlib_data/cn_data",
        region=REG_CN,
        task_url="mongodb://10.0.0.4:27017/",
        task_db_name="rolling_db",
        experiment_name="rolling_exp",
        task_pool="rolling_task",
        task_config=None,
        rolling_step=550,
        rolling_type=RollingGen.ROLL_SD,
    ):
        """Initialise qlib and remember the settings used by the other steps.

        Parameters
        ----------
        provider_uri, region
            Forwarded unchanged to ``qlib.init``.
        task_url, task_db_name
            Packed into the ``mongo`` configuration handed to ``qlib.init``.
        experiment_name
            Experiment used for training, collecting and resetting.
        task_pool
            Name of the task pool used by ``TaskManager``, ``TrainerRM`` and ``run_task``.
        task_config
            Task templates to roll. When ``None``, the CSI100 XGBoost and LightGBM
            record configs are used.
        rolling_step, rolling_type
            Passed to ``RollingGen`` as ``step`` and ``rtype``.
        """
        # Fall back to the two bundled task templates when the caller supplies none.
        if task_config is None:
            task_config = [CSI100_RECORD_XGBOOST_TASK_CONFIG, CSI100_RECORD_LGB_TASK_CONFIG]

        # TaskManager config is handed to qlib through the `mongo` argument.
        qlib.init(
            provider_uri=provider_uri,
            region=region,
            mongo=dict(task_url=task_url, task_db_name=task_db_name),
        )

        self.experiment_name = experiment_name
        self.task_pool = task_pool
        self.task_config = task_config
        self.rolling_gen = RollingGen(step=rolling_step, rtype=rolling_type)

    def reset(self):
        """Put everything back to its initial state.

        Calls ``remove()`` on the task pool's ``TaskManager`` and deletes every recorder
        listed by the experiment. Be careful to save important data beforehand.
        """
        print("========== reset ==========")
        TaskManager(task_pool=self.task_pool).remove()
        experiment = R.get_exp(experiment_name=self.experiment_name)
        for recorder_id in experiment.list_recorders():
            experiment.delete_recorder(recorder_id)

    def task_generating(self):
        """Build the tasks from ``self.task_config``, pretty-print them and return them."""
        print("========== task_generating ==========")
        generated = task_generator(
            tasks=self.task_config,
            generators=self.rolling_gen,  # generate different date segments
        )
        pprint(generated)
        return generated

    def task_training(self, tasks):
        """Train ``tasks`` with a ``TrainerRM`` bound to this experiment and task pool."""
        print("========== task_training ==========")
        TrainerRM(self.experiment_name, self.task_pool).train(tasks)

    def worker(self):
        """Train pending tasks of the pool; meant to be run by other processes or machines.

        This is the multiprocessing entry point. It is the same as ``TrainerRM.worker``.
        """
        print("========== worker ==========")
        run_task(task_train, self.task_pool, experiment_name=self.experiment_name)

    def task_collecting(self):
        """Collect the recorded results of the experiment and print them."""
        print("========== task_collecting ==========")

        def rec_key(recorder):
            # Key each recorder by (model class name, test segment of its dataset).
            task = recorder.load_object("task")
            return task["model"]["class"], task["dataset"]["kwargs"]["segments"]["test"]

        def my_filter(recorder):
            # only choose the results of "LGBModel"
            return rec_key(recorder)[0] == "LGBModel"

        collector = RecorderCollector(
            experiment=self.experiment_name,
            process_list=RollingGroup(),
            rec_key_func=rec_key,
            rec_filter_func=my_filter,
        )
        print(collector())

    def main(self):
        """Run the whole example: reset, generate tasks, train them, collect the results."""
        self.reset()
        self.task_training(self.task_generating())
        self.task_collecting()
|
|
|
|
|
|
if __name__ == "__main__":
    # Command-line entry point: the class is handed to `fire`, so a method name
    # and its parameters can be given on the command line.
    # To see the whole process with your own parameters, use the command below:
    #   python task_manager_rolling.py main --experiment_name="your_exp_name"
    fire.Fire(RollingTaskExample)
|