175 lines
5.9 KiB
Python
175 lines
5.9 KiB
Python
"""
|
||
动量因子模块
|
||
包含基于股票截面和日期截面的动量因子实现
|
||
"""
|
||
|
||
import numpy as np
|
||
import polars as pl
|
||
from main.factor.operator_framework import StockWiseFactor, DateWiseFactor
|
||
|
||
|
||
# -------------------- 股票截面因子:基于时间序列的动量因子 --------------------
|
||
class ReturnFactor(StockWiseFactor):
|
||
"""N日收益率因子"""
|
||
|
||
def __init__(self, period: int = 20):
|
||
super().__init__(
|
||
name="return",
|
||
parameters={"period": period},
|
||
required_factor_ids=["close"]
|
||
)
|
||
self.period = period
|
||
|
||
def calc_factor(self, group_df: pl.DataFrame) -> pl.Series:
|
||
# 计算N日收益率(时间序列操作)
|
||
return group_df["close"].pct_change(self.period).alias(self.factor_id)
|
||
|
||
|
||
class VolatilityFactor(StockWiseFactor):
|
||
"""N日波动率因子"""
|
||
|
||
def __init__(self, period: int = 20):
|
||
super().__init__(
|
||
name="volatility",
|
||
parameters={"period": period},
|
||
required_factor_ids=["pct_chg"]
|
||
)
|
||
self.period = period
|
||
|
||
def calc_factor(self, group_df: pl.DataFrame) -> pl.Series:
|
||
# 计算N日波动率(时间序列操作)
|
||
return group_df["pct_chg"].rolling_std(self.period).alias(self.factor_id)
|
||
|
||
|
||
class MomentumFactor(StockWiseFactor):
|
||
"""动量因子:过去N日累计收益率"""
|
||
|
||
def __init__(self, period: int = 20):
|
||
super().__init__(
|
||
name="momentum",
|
||
parameters={"period": period},
|
||
required_factor_ids=["pct_chg"]
|
||
)
|
||
self.period = period
|
||
|
||
def calc_factor(self, group_df: pl.DataFrame) -> pl.Series:
|
||
# 计算N日累计动量(时间序列操作)
|
||
return group_df["pct_chg"].rolling_sum(self.period).alias(self.factor_id)
|
||
|
||
class MomentumAcceleration(StockWiseFactor):
|
||
"""
|
||
动量加速因子:
|
||
(短期波动率调整后动量 - 长期波动率调整后动量)
|
||
用于捕捉趋势正在形成或加强的股票
|
||
"""
|
||
|
||
def __init__(self, short_period: int = 20, long_period: int = 60):
|
||
super().__init__(
|
||
name="momentum_acceleration",
|
||
parameters={"short_period": short_period, "long_period": long_period},
|
||
required_factor_ids=["pct_chg"]
|
||
)
|
||
self.short_period = short_period
|
||
self.long_period = long_period
|
||
|
||
def calc_factor(self, group_df: pl.DataFrame) -> pl.Series:
|
||
epsilon = 1e-9
|
||
|
||
# 计算短期波动率调整后动量
|
||
short_momentum = group_df["pct_chg"].rolling_sum(self.short_period)
|
||
short_vol = group_df["pct_chg"].rolling_std(self.short_period)
|
||
short_adj_momentum = short_momentum / (short_vol + epsilon)
|
||
|
||
# 计算长期波动率调整后动量
|
||
long_momentum = group_df["pct_chg"].rolling_sum(self.long_period)
|
||
long_vol = group_df["pct_chg"].rolling_std(self.long_period)
|
||
long_adj_momentum = long_momentum / (long_vol + epsilon)
|
||
|
||
# 计算加速因子
|
||
acceleration = (short_adj_momentum - long_adj_momentum).alias(self.factor_id)
|
||
|
||
return acceleration
|
||
|
||
|
||
class TrendEfficiency(StockWiseFactor):
|
||
"""
|
||
趋势效率因子:
|
||
过去N日价格净变化 / 过去N日每日价格变化的绝对值之和
|
||
衡量趋势的信噪比,值越接近1,趋势越清晰、噪声越小
|
||
"""
|
||
|
||
def __init__(self, period: int = 20):
|
||
super().__init__(
|
||
name="trend_efficiency",
|
||
parameters={"period": period},
|
||
# 此因子需要收盘价来计算
|
||
required_factor_ids=["close"]
|
||
)
|
||
self.period = period
|
||
|
||
def calc_factor(self, group_df: pl.DataFrame) -> pl.Series:
|
||
# 1. 计算N日内的净价格变动(信号)
|
||
# 使用 diff(n) 计算当前价格与n天前价格的差值
|
||
net_change = group_df["close"].diff(self.period).abs()
|
||
|
||
# 2. 计算N日内每日价格变动的绝对值之和(总路径/噪声)
|
||
# 先计算每日变动 diff(1),取绝对值,再滚动求和
|
||
total_path = group_df["close"].diff(1).abs().rolling_sum(self.period)
|
||
|
||
# 3. 计算效率比率
|
||
epsilon = 1e-9
|
||
efficiency_ratio = (net_change / (total_path + epsilon)).alias(self.factor_id)
|
||
|
||
return efficiency_ratio
|
||
|
||
# -------------------- 统一计算函数 --------------------
|
||
def calculate_momentum_factors(df: pl.DataFrame) -> pl.DataFrame:
|
||
"""
|
||
统一计算动量因子的函数
|
||
|
||
Parameters:
|
||
df (pl.DataFrame): 输入的股票数据表,必须包含以下列:
|
||
ts_code, trade_date, close, pct_chg, high, low, vol
|
||
|
||
Returns:
|
||
pl.DataFrame: 包含所有动量因子的DataFrame
|
||
"""
|
||
# 初始化结果DataFrame
|
||
result_df = df.clone()
|
||
|
||
# 定义要计算的因子列表
|
||
# 先计算股票截面因子(时间序列因子)
|
||
stock_operators = [
|
||
ReturnFactor(5),
|
||
ReturnFactor(20),
|
||
VolatilityFactor(10),
|
||
VolatilityFactor(30),
|
||
MomentumFactor(10),
|
||
MomentumFactor(30),
|
||
RSI_Factor(14)
|
||
]
|
||
|
||
# 依次应用股票截面因子算子
|
||
for operator in stock_operators:
|
||
try:
|
||
result_df = operator.apply(result_df)
|
||
except Exception as e:
|
||
print(f"计算股票截面因子 {operator.factor_id} 时出错: {e}")
|
||
|
||
# 再计算日期截面因子(横截面排序因子)
|
||
date_operators = [
|
||
CrossSectionalRanking("return_5d"),
|
||
CrossSectionalRanking("return_20d"),
|
||
CrossSectionalRanking("volatility_10d"),
|
||
CrossSectionalRanking("momentum_10d")
|
||
]
|
||
|
||
# 依次应用日期截面因子算子
|
||
for operator in date_operators:
|
||
try:
|
||
result_df = operator.apply(result_df)
|
||
except Exception as e:
|
||
print(f"计算日期截面因子 {operator.factor_id} 时出错: {e}")
|
||
|
||
return result_df
|