Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Submit feedback
Sign in
Toggle navigation
A
alpha-mind
Project
Project
Details
Activity
Releases
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
Dr.李
alpha-mind
Commits
339dabd6
Commit
339dabd6
authored
Aug 19, 2017
by
Dr.李
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
added date range api
parent
1acf5b7a
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
130 additions
and
15 deletions
+130
-15
sqlengine.py
alphamind/data/engines/sqlengine.py
+107
-13
universe.py
alphamind/data/engines/universe.py
+23
-2
No files found.
alphamind/data/engines/sqlengine.py
View file @
339dabd6
...
...
@@ -13,7 +13,7 @@ import numpy as np
import
pandas
as
pd
import
sqlalchemy
as
sa
import
sqlalchemy.orm
as
orm
from
sqlalchemy
import
select
,
and_
,
outerjoin
from
sqlalchemy
import
select
,
and_
,
outerjoin
,
join
from
sqlalchemy.sql
import
func
from
alphamind.data.engines.universe
import
Universe
from
alphamind.data.dbmodel.models
import
FactorMaster
...
...
@@ -143,13 +143,19 @@ class SqlEngine(object):
strategy_names
=
{
s
[
0
]
for
s
in
cursor
.
fetchall
()}
return
strategy_names
def fetch_codes(self, ref_date: str, universe: Universe) -> List[int]:
    """Return the sorted, de-duplicated codes of ``universe`` on ``ref_date``.

    :param ref_date: date passed straight through to ``universe.query``.
    :param universe: universe definition that builds the selection query.
    :return: ascending list of the distinct codes found by the query.
    """
    query = universe.query(ref_date)
    cursor = self.engine.execute(query)
    # ``Universe.query`` selects (Date, Code), so the code sits at index 1.
    # ``fetchall`` drains the cursor, hence it must be called exactly once.
    return sorted({row[1] for row in cursor.fetchall()})
def fetch_codes_range(self, start_date: str, end_date: str, universe: Universe) -> pd.DataFrame:
    """Load the rows produced by ``universe.query_range`` into a DataFrame.

    :param start_date: first bound handed to ``universe.query_range``.
    :param end_date: second bound handed to ``universe.query_range``.
    :param universe: universe definition that builds the range query.
    :return: result of running that query against ``self.engine``.
    """
    return pd.read_sql(universe.query_range(start_date, end_date), self.engine)
def
fetch_dx_return
(
self
,
ref_date
,
codes
,
expiry_date
=
None
,
horizon
=
0
):
start_date
=
ref_date
...
...
@@ -183,6 +189,24 @@ class SqlEngine(object):
return
pd
.
read_sql
(
query
,
self
.
engine
)
def fetch_factor_range(self,
                       start_date: str,
                       end_date: str,
                       factors: Iterable[str],
                       universe: Universe) -> pd.DataFrame:
    """Fetch factor values for every (Date, Code) of a universe over a date range.

    ``Market`` is inner-joined with the universe range query, then every
    distinct table returned by ``_map_factors`` is outer-joined on
    (Date, Code), so a missing factor row does not drop the market row.

    :param start_date: first bound of the universe range query.
    :param end_date: second bound of the universe range query.
    :param factors: factor names resolved through ``_map_factors``.
    :param universe: universe definition that restricts the rows.
    :return: DataFrame with ``Market.Date``, ``Market.Code``,
        ``Market.isOpen`` followed by the mapped factor columns.
    """
    factor_cols = _map_factors(factors)
    universe_q = universe.query_range(start_date, end_date).alias('temp_universe')

    on_universe = and_(Market.Date == universe_q.c.Date,
                       Market.Code == universe_q.c.Code)
    joined = join(Market, universe_q, on_universe)

    # Several factors may live in the same table; join each table only once.
    for factor_table in set(factor_cols.values()):
        on_factor = and_(Market.Date == factor_table.Date,
                         Market.Code == factor_table.Code)
        joined = outerjoin(joined, factor_table, on_factor)

    selected = [Market.Date, Market.Code, Market.isOpen]
    selected.extend(factor_cols.keys())

    query = select(selected).select_from(joined)
    return pd.read_sql(query, self.engine)
def
fetch_benchmark
(
self
,
ref_date
:
str
,
benchmark
:
int
)
->
pd
.
DataFrame
:
...
...
@@ -195,6 +219,19 @@ class SqlEngine(object):
return
pd
.
read_sql
(
query
,
self
.
engine
)
def fetch_benchmark_range(self, start_date: str, end_date: str, benchmark: int) -> pd.DataFrame:
    """Fetch index constituents and weights for a benchmark over a date range.

    :param start_date: lower bound of the ``BETWEEN`` filter on ``Date``.
    :param end_date: upper bound of the ``BETWEEN`` filter on ``Date``.
    :param benchmark: value matched against ``IndexComponent.indexCode``.
    :return: DataFrame with ``Date``, ``Code`` and ``weight`` columns, where
        ``weight`` is the stored weight divided by 100
        (presumably percent -> fraction; confirm against the table definition).
    """
    scaled_weight = (IndexComponent.weight / 100.).label('weight')
    in_range = IndexComponent.Date.between(start_date, end_date)
    is_benchmark = IndexComponent.indexCode == benchmark

    columns = [IndexComponent.Date, IndexComponent.Code, scaled_weight]
    query = select(columns).where(and_(in_range, is_benchmark))
    return pd.read_sql(query, self.engine)
def
fetch_risk_model
(
self
,
ref_date
:
str
,
codes
:
Iterable
[
int
],
...
...
@@ -222,6 +259,39 @@ class SqlEngine(object):
return
risk_cov
,
risk_exp
def fetch_risk_model_range(self,
                           start_date: str,
                           end_date: str,
                           universe: Universe,
                           risk_model: str = 'short') -> Tuple[pd.DataFrame, pd.DataFrame]:
    """Fetch factor covariances and per-code risk exposures over a date range.

    :param start_date: lower bound of the date filters.
    :param end_date: upper bound of the date filters.
    :param universe: universe definition that restricts the exposure rows.
    :param risk_model: key passed to ``_map_risk_model_table`` to pick the
        covariance table and the specific-risk table.
    :return: ``(risk_cov, risk_exp)``. ``risk_cov`` holds ``Date``,
        ``FactorID``, ``Factor`` plus one column per entry of
        ``total_risk_factors``, sorted by ``Date`` then ``FactorID``.
        ``risk_exp`` holds ``Date``, ``Code``, ``SRISK`` plus the
        ``RiskExposure`` columns named in ``total_risk_factors``.
    """
    risk_cov_table, special_risk_table = _map_risk_model_table(risk_model)

    # --- factor covariance -------------------------------------------------
    cov_risk_cols = [risk_cov_table.__table__.columns[f] for f in total_risk_factors]
    cov_query = select(
        [risk_cov_table.Date, risk_cov_table.FactorID, risk_cov_table.Factor] + cov_risk_cols
    ).where(
        risk_cov_table.Date.between(start_date, end_date)
    )
    risk_cov = pd.read_sql(cov_query, self.engine).sort_values(['Date', 'FactorID'])

    # --- specific risk + factor exposures ----------------------------------
    risk_exposure_cols = [RiskExposure.__table__.columns[f] for f in total_risk_factors]
    big_table = outerjoin(special_risk_table, RiskExposure,
                          and_(special_risk_table.Date == RiskExposure.Date,
                               special_risk_table.Code == RiskExposure.Code))

    q2 = universe.query_range(start_date, end_date).alias('temp_universe')
    big_table = join(big_table, q2,
                     and_(special_risk_table.Date == q2.c.Date,
                          special_risk_table.Code == q2.c.Code))

    # Take the key columns from the left (always present) side of the outer
    # join. RiskExposure is the nullable side, so its Date/Code would be NULL
    # for every code that has specific risk but no exposure row, which makes
    # those rows impossible to merge on ['Date', 'Code'] downstream.
    # NOTE(review): assumes both models name these columns 'Date' / 'Code'.
    exp_query = select(
        [special_risk_table.Date, special_risk_table.Code, special_risk_table.SRISK]
        + risk_exposure_cols
    ).select_from(big_table)

    risk_exp = pd.read_sql(exp_query, self.engine)
    return risk_cov, risk_exp
def
fetch_data
(
self
,
ref_date
,
factors
:
Iterable
[
str
],
codes
:
Iterable
[
int
],
...
...
@@ -248,6 +318,34 @@ class SqlEngine(object):
append_industry_info
(
factor_data
)
return
total_data
def fetch_data_range(self,
                     start_date: str,
                     end_date: str,
                     factors: Iterable[str],
                     universe: Universe,
                     benchmark: int = None,
                     risk_model: str = 'short') -> Dict[str, pd.DataFrame]:
    """Assemble factor, benchmark and risk data for a universe over a date range.

    :param start_date: lower bound forwarded to the range fetchers.
    :param end_date: upper bound forwarded to the range fetchers.
    :param factors: factor names forwarded to ``fetch_factor_range``.
    :param universe: universe definition forwarded to the range fetchers.
    :param benchmark: index code; when truthy, benchmark weights are fetched,
        left-merged into the factor frame and missing weights become 0.
    :param risk_model: risk model key; when truthy, the covariance is fetched
        and the exposures are left-merged into the factor frame.
    :return: dict with key ``'factor'`` and, depending on the arguments,
        ``'benchmark'`` and ``'risk_cov'``.
    """
    merge_keys = ['Date', 'Code']
    result = {}

    factor_df = self.fetch_factor_range(start_date, end_date, factors, universe)

    if benchmark:
        bench_df = self.fetch_benchmark_range(start_date, end_date, benchmark)
        result['benchmark'] = bench_df
        factor_df = factor_df.merge(bench_df, how='left', on=merge_keys)
        # Codes outside the benchmark have no weight row after the left merge.
        factor_df['weight'] = factor_df['weight'].fillna(0.)

    if risk_model:
        risk_cov, risk_exp = self.fetch_risk_model_range(start_date,
                                                         end_date,
                                                         universe,
                                                         risk_model)
        factor_df = factor_df.merge(risk_exp, how='left', on=merge_keys)
        result['risk_cov'] = risk_cov

    append_industry_info(factor_df)
    result['factor'] = factor_df
    return result
if
__name__
==
'__main__'
:
db_url
=
'postgresql+psycopg2://postgres:we083826@localhost/alpha'
...
...
@@ -256,12 +354,8 @@ if __name__ == '__main__':
engine
=
SqlEngine
(
db_url
)
ref_date
=
'2017-08-10'
codes
=
engine
.
fetch_codes
(
ref_date
,
universe
)
data
=
engine
.
fetch_data
(
ref_date
,
[
'EPS'
],
codes
,
905
,
'short'
)
d1ret
=
engine
.
fetch_dx_return
(
ref_date
,
codes
,
horizon
=
0
)
missing_codes
=
[
c
for
c
in
data
[
'factor'
]
.
Code
if
c
not
in
set
(
d1ret
.
Code
)]
codes
=
engine
.
fetch_codes_range
(
'2017-01-01'
,
'2017-08-10'
,
universe
)
data
=
engine
.
fetch_data_range
(
'2017-01-01'
,
'2017-08-10'
,
[
'EPS'
],
universe
,
905
,
'short'
)
print
(
codes
)
print
(
data
)
print
(
len
(
data
[
'factor'
]))
print
(
len
(
d1ret
))
print
(
missing_codes
)
alphamind/data/engines/universe.py
View file @
339dabd6
...
...
@@ -30,8 +30,7 @@ class Universe(object):
self
.
include_codes
=
include_codes
self
.
exclude_codes
=
exclude_codes
def
query
(
self
,
ref_date
):
query
=
select
([
UniverseTable
.
Code
])
.
distinct
()
def
_create_condition
(
self
):
all_and_conditions
=
[]
...
...
@@ -55,6 +54,12 @@ class Universe(object):
codes_in
=
UniverseTable
.
Code
.
in_
(
self
.
include_codes
)
all_or_conditions
.
append
(
codes_in
)
return
all_and_conditions
,
all_or_conditions
def
query
(
self
,
ref_date
):
query
=
select
([
UniverseTable
.
Date
,
UniverseTable
.
Code
])
.
distinct
()
all_and_conditions
,
all_or_conditions
=
self
.
_create_condition
()
query
=
query
.
where
(
and_
(
UniverseTable
.
Date
==
ref_date
,
...
...
@@ -66,3 +71,19 @@ class Universe(object):
)
return
query
def query_range(self, start_date, end_date):
    """Build the distinct (Date, Code) selection for a date range.

    A row qualifies when its ``Date`` lies between ``start_date`` and
    ``end_date`` and it either satisfies every "and" condition or any of
    the "or" conditions produced by ``_create_condition``.

    :param start_date: lower bound of the ``BETWEEN`` filter.
    :param end_date: upper bound of the ``BETWEEN`` filter.
    :return: the un-executed select statement.
    """
    base = select([UniverseTable.Date, UniverseTable.Code]).distinct()
    and_conds, or_conds = self._create_condition()

    date_filter = UniverseTable.Date.between(start_date, end_date)
    membership = or_(and_(*and_conds), *or_conds)

    return base.where(and_(date_filter, membership))
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment