Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Submit feedback
Sign in
Toggle navigation
A
alpha-mind
Project
Project
Details
Activity
Releases
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
Dr.李
alpha-mind
Commits
a9579e26
Commit
a9579e26
authored
Jan 17, 2019
by
Dr.李
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
added one more quick start
parent
e229caa7
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
316 additions
and
0 deletions
+316
-0
Quick Start 4 - Step By Step Alpha Modeling.ipynb
notebooks/Quick Start 4 - Step By Step Alpha Modeling.ipynb
+316
-0
No files found.
notebooks/Quick Start 4 - Step By Step Alpha Modeling.ipynb
0 → 100644
View file @
a9579e26
{
"cells": [
{
"cell_type": "markdown",
"metadata": {},
"source": [
"> 在本文中,我们给出一个分步骤使用原始的多因子数据、生成目标权重的例子。"
]
},
{
"cell_type": "code",
"execution_count": 136,
"metadata": {},
"outputs": [],
"source": [
"%matplotlib inline\n",
"import os\n",
"import numpy as np\n",
"import pandas as pd\n",
"from alphamind.data.dbmodel.models import Uqer\n",
"from alphamind.data.dbmodel.models import Universe\n",
"from alphamind.data.dbmodel.models import Industry\n",
"from alphamind.data.dbmodel.models import IndexComponent\n",
"from alphamind.data import neutralize\n",
"from alphamind.portfolio.linearbuilder import linear_builder\n",
"import sqlalchemy as sa\n",
"from sqlalchemy import outerjoin, and_, select\n",
"from matplotlib import rc\n",
"from matplotlib import pyplot as plt\n",
"\n",
"rc('font', **{'family': 'Microsoft YaHei', 'size': 10})\n",
"rc('mathtext', **{'default': 'regular'})\n",
"rc('legend', **{'frameon': False})"
]
},
{
"cell_type": "code",
"execution_count": 95,
"metadata": {},
"outputs": [],
"source": [
"universe_name = 'zz800'\n",
"trade_date = '2019-01-15'\n",
"factor = 'EPS'\n",
"industry_name = '申万行业分类'\n",
"benchmark_code = 906\n",
"max_active_industry_exposure = 0.\n",
"max_active_single_stock_exposure = 0.02\n",
"con = sa.create_engine(os.environ['DB_URI'])"
]
},
{
"cell_type": "code",
"execution_count": 96,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Wall time: 457 ms\n"
]
}
],
"source": [
"%%time\n",
"\n",
"big_table = outerjoin(Uqer, Universe, and_(Uqer.trade_date == Universe.trade_date,\n",
" Uqer.code == Universe.code))\n",
"\n",
"query = select([Uqer.code, getattr(Uqer, factor)]).select_from(big_table) \\\n",
" .where(and_(Uqer.trade_date == trade_date, \n",
" getattr(Universe, universe_name) == 1))\n",
"\n",
"factors = pd.read_sql(query, con=con)\n",
"factors.head()"
]
},
{
"cell_type": "code",
"execution_count": 97,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Wall time: 160 ms\n"
]
}
],
"source": [
"%%time\n",
"\n",
"big_table = outerjoin(Industry, Universe, and_(Industry.trade_date == Universe.trade_date,\n",
" Industry.code == Universe.code))\n",
"\n",
"query = select([Industry.code, Industry.industryName1]).select_from(big_table) \\\n",
" .where(and_(Industry.trade_date == trade_date,\n",
" Industry.industry == industry_name,\n",
" getattr(Universe, universe_name) == 1))\n",
"\n",
"industry = pd.read_sql(query, con=con)\n",
"industry.head()"
]
},
{
"cell_type": "code",
"execution_count": 98,
"metadata": {},
"outputs": [],
"source": [
"df = pd.merge(factors, industry, on=['code'], how='inner').dropna()\n",
"industry_dummy = pd.get_dummies(df.industryName1)"
]
},
{
"cell_type": "code",
"execution_count": 99,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Wall time: 1 ms\n"
]
}
],
"source": [
"%%time\n",
"\n",
"df['neutralized_factor'] = neutralize(industry_dummy.values.astype(float), df[factor].values).flatten()"
]
},
{
"cell_type": "code",
"execution_count": 100,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Wall time: 113 ms\n"
]
}
],
"source": [
"%%time\n",
"\n",
"# Benchmark constituents are selected from IndexComponent alone. The previous\n",
"# outer join with Universe was never passed to select_from(), so it had no effect\n",
"# on the emitted SQL and has been dropped.\n",
"query = select([IndexComponent.code, (IndexComponent.weight / 100.).label('index_weight')]) \\\n",
"    .where(and_(IndexComponent.trade_date == trade_date,\n",
"                IndexComponent.indexCode == benchmark_code))\n",
"\n",
"index_components = pd.read_sql(query, con=con)\n",
"index_components.head()"
]
},
{
"cell_type": "code",
"execution_count": 101,
"metadata": {},
"outputs": [],
"source": [
"df = pd.merge(df, index_components, on=['code'], how='inner').dropna()"
]
},
{
"cell_type": "code",
"execution_count": 111,
"metadata": {},
"outputs": [],
"source": [
"er = df.neutralized_factor.values\n",
"# Lower bound per stock: the larger of -cap and -index_weight.\n",
"lbound = np.maximum(-max_active_single_stock_exposure, -df['index_weight'].values)\n",
"ubound = max_active_single_stock_exposure\n",
"# Build the industry exposures from the current (merged) frame: the inner merge/dropna\n",
"# with index_components can drop rows, so dummies built before it may no longer have\n",
"# the same number of rows as er.\n",
"industry_exposure = pd.get_dummies(df.industryName1).values.astype(float)\n",
"risk_constraints = np.concatenate((industry_exposure, np.ones((len(er), 1))), axis=1)\n",
"industry_low_bounds = -max_active_industry_exposure * np.ones(industry_exposure.shape[1])\n",
"industry_up_bounds = max_active_industry_exposure * np.ones(industry_exposure.shape[1])\n",
"# The last constraint column (all ones) gets 0 as both its lower and upper target.\n",
"risk_target = (np.concatenate((industry_low_bounds, [0.])),\n",
"               np.concatenate((industry_up_bounds, [0.])),)"
]
},
{
"cell_type": "code",
"execution_count": 112,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Wall time: 8.98 ms\n"
]
}
],
"source": [
"%%time\n",
"\n",
"status, optimized_values, weights = linear_builder(er,\n",
" lbound,\n",
" ubound,\n",
" risk_constraints,\n",
" risk_target)"
]
},
{
"cell_type": "code",
"execution_count": 129,
"metadata": {},
"outputs": [],
"source": [
"df['portfolio_weight'] = df['index_weight'] + weights\n",
"df['active_weight'] = weights"
]
},
{
"cell_type": "code",
"execution_count": 137,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"<matplotlib.axes._subplots.AxesSubplot at 0x193c2c75f28>"
]
},
"execution_count": 137,
"metadata": {},
"output_type": "execute_result"
},
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 1008x504 with 1 Axes>"
]
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
],
"source": [
"# Aggregate only the two plotted columns instead of summing every column (including 'code').\n",
"df.groupby('industryName1')[['index_weight', 'portfolio_weight']].sum().plot.bar(figsize=(14, 7))"
]
},
{
"cell_type": "code",
"execution_count": 139,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"(-0.02, 0.025)"
]
},
"execution_count": 139,
"metadata": {},
"output_type": "execute_result"
},
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 1008x504 with 1 Axes>"
]
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
],
"source": [
"df.plot(kind='scatter', x='neutralized_factor', y='active_weight', figsize=(14, 7))\n",
"plt.xlim((-5, 5))\n",
"plt.ylim((-0.02, 0.025))"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.6.8"
}
},
"nbformat": 4,
"nbformat_minor": 2
}
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment