WBS-7.3.1: Upgraded distribution_risk_score algorithm to match GAS and implemented parity tests

This commit is contained in:
2026-06-22 10:42:00 +09:00
parent b5ef2017a2
commit 39ee9c620f
2 changed files with 183 additions and 12 deletions
@@ -0,0 +1,83 @@
from __future__ import annotations
import sys
import unittest
from pathlib import Path
ROOT = Path(__file__).resolve().parents[2]
if str(ROOT) not in sys.path:
sys.path.insert(0, str(ROOT))
from tools.build_distribution_risk_score_v2 import calculate_distribution_risk
class TestDistributionRiskParity(unittest.TestCase):
def test_distribution_risk_parity_scenarios(self):
# Scenario 1: Smart Money Outflow only
row_1 = {
"close": 10000,
"ma20": 10000,
"frg_5d": -100,
"inst_5d": -200,
}
res_1 = calculate_distribution_risk(row_1, kospi_ret_5d=0.0)
self.assertEqual(res_1["distribution_risk_score"], 30)
self.assertIn("smart_money_outflow", res_1["reason_codes"])
self.assertEqual(res_1["anti_distribution_state"], "PASS")
# Scenario 2: High upper wick and low flow credit under priceAboveMa20
row_2 = {
"close": 12000,
"ma20": 10000, # priceAboveMa20 = True
"high": 15000,
"low": 10000,
# upperWickRatio = (15000-12000)/5000 = 3000/5000 = 0.60 >= 0.45
"flow_credit": 0.35, # flow_credit < 0.40
}
res_2 = calculate_distribution_risk(row_2, kospi_ret_5d=0.0)
self.assertIn("upper_wick_distribution", res_2["reason_codes"])
self.assertIn("flow_credit_low", res_2["reason_codes"])
# score = 15 (upper wick) + 20 (flow credit low) = 35
self.assertEqual(res_2["distribution_risk_score"], 35)
# Scenario 3: Trim Review threshold (score >= 55)
row_3 = {
"close": 10000,
"ma20": 10000,
"frg_5d": -100,
"inst_5d": -200, # +30
"flow_credit": 0.30, # +20
"volume": 70,
"avg_volume_5d": 100, # volume < 80% of avg_vol_5d -> +20
}
res_3 = calculate_distribution_risk(row_3, kospi_ret_5d=0.0)
# score = 30 + 20 + 20 = 70 (BLOCK_BUY)
self.assertEqual(res_3["distribution_risk_score"], 70)
self.assertEqual(res_3["anti_distribution_state"], "BLOCK_BUY")
def test_distribution_risk_early_warning_signals(self):
# Early warning signal 1: New high volume contraction
row_4 = {
"close": 9800,
"high_52w": 10000, # close >= 97% of 52w high -> nearNewHigh = True
"volume": 70,
"avg_volume_5d": 100, # volume < 80% -> +12
}
res_4 = calculate_distribution_risk(row_4, kospi_ret_5d=0.0)
self.assertIn("new_high_volume_contraction", res_4["reason_codes"])
self.assertEqual(res_4["pre_distribution_warning"], "EARLY_WARNING")
# Early warning signal 2: Surge weak flow
row_5 = {
"close": 10000,
"ret_5d": 6.0, # ret5d >= 5
"flow_credit": 0.40, # flow_credit < 0.45 -> +10
}
res_5 = calculate_distribution_risk(row_5, kospi_ret_5d=0.0)
self.assertIn("surge_weak_flow", res_5["reason_codes"])
self.assertEqual(res_5["pre_distribution_warning"], "EARLY_WARNING")
if __name__ == "__main__":
unittest.main()
+100 -12
View File
@@ -6,6 +6,93 @@ from pathlib import Path
ROOT = Path(__file__).resolve().parents[1] ROOT = Path(__file__).resolve().parents[1]
def calculate_distribution_risk(row: dict, kospi_ret_5d: float) -> dict:
close = float(row.get("Close") or row.get("close") or 0.0)
ma20 = float(row.get("MA20") or row.get("ma20") or 0.0)
high = float(row.get("High") or row.get("high") or close)
low = float(row.get("Low") or row.get("low") or close)
volume = row.get("Volume") or row.get("volume")
avg_vol_5d = row.get("AvgVolume5d") or row.get("avg_volume_5d") or row.get("Avg_Volume_5D")
flow_credit = row.get("FlowCredit") or row.get("flow_credit") or row.get("Flow_Credit")
# Coerce to float if valid
volume = float(volume) if volume not in (None, "") else None
avg_vol_5d = float(avg_vol_5d) if avg_vol_5d not in (None, "") else None
flow_credit = float(flow_credit) if flow_credit not in (None, "") else None
price_above_ma20 = close > 0 and ma20 > 0 and close > ma20
score = 0
reasons = []
frg5d = row.get("Frg5D") or row.get("frg_5d") or row.get("Frg_5D")
inst5d = row.get("Inst5D") or row.get("inst_5d") or row.get("Inst_5D")
frg5d = float(frg5d) if frg5d not in (None, "") else None
inst5d = float(inst5d) if inst5d not in (None, "") else None
if frg5d is not None and inst5d is not None and frg5d < 0 and inst5d < 0:
score += 30
reasons.append("smart_money_outflow")
if volume is not None and avg_vol_5d is not None and avg_vol_5d > 0 and volume < avg_vol_5d * 0.80:
score += 20
reasons.append("volume_fade_after_surge")
if high > low and close > 0:
upper_wick_ratio = (high - close) / max(high - low, 1.0)
if upper_wick_ratio >= 0.45 and price_above_ma20:
score += 15
reasons.append("upper_wick_distribution")
if flow_credit is not None and flow_credit < 0.40:
score += 20
reasons.append("flow_credit_low")
ret5d = row.get("Ret5D") or row.get("ret_5d") or row.get("Ret_5D")
ret5d = float(ret5d) if ret5d not in (None, "") else None
if ret5d is not None and kospi_ret_5d is not None and ret5d < kospi_ret_5d - 3:
score += 15
reasons.append("sector_relative_lag")
ac_gate = row.get("acGate") or row.get("ac_gate")
if ac_gate and "CLIMAX" in str(ac_gate).upper():
score += 15
reasons.append("anti_climax_gate")
ac_total = row.get("acTotal") or row.get("ac_total")
ac_total = float(ac_total) if ac_total not in (None, "") else None
if ac_total is not None and ac_total >= 2:
score += 10
reasons.append("ac_total_gte2")
val_surge_pct = row.get("valSurgePct") or row.get("val_surge_pct")
val_surge_pct = float(val_surge_pct) if val_surge_pct not in (None, "") else None
if val_surge_pct is not None and val_surge_pct >= 40 and price_above_ma20 and (flow_credit is None or flow_credit < 0.50):
score += 10
reasons.append("val_surge_no_flow_support")
high52w = row.get("high52w") or row.get("high_52w") or row.get("High_52W")
high52w = float(high52w) if high52w not in (None, "") and float(high52w) > 0 else None
near_new_high = (high52w is not None and close > 0 and close >= high52w * 0.97) or (ma20 > 0 and close > ma20 * 1.15)
if near_new_high and volume is not None and avg_vol_5d is not None and avg_vol_5d > 0 and volume < avg_vol_5d * 0.80:
score += 12
reasons.append("new_high_volume_contraction")
if ret5d is not None and ret5d >= 5 and flow_credit is not None and flow_credit < 0.45:
score += 10
reasons.append("surge_weak_flow")
final_score = min(100, max(0, score))
state = "BLOCK_BUY" if final_score >= 70 else "TRIM_REVIEW" if final_score >= 55 else "PASS"
pre_dist_warning = "EARLY_WARNING" if ("new_high_volume_contraction" in reasons or "surge_weak_flow" in reasons) else "NONE"
return {
"distribution_risk_score": final_score,
"anti_distribution_state": state,
"pre_distribution_warning": pre_dist_warning,
"reason_codes": reasons
}
def main(): def main():
parser = argparse.ArgumentParser() parser = argparse.ArgumentParser()
parser.add_argument("--json", default="GatherTradingData.json") parser.add_argument("--json", default="GatherTradingData.json")
@@ -18,22 +105,23 @@ def main():
sys.exit(1) sys.exit(1)
raw = json.loads(json_path.read_text(encoding="utf-8")) raw = json.loads(json_path.read_text(encoding="utf-8"))
core_satellite = raw.get("data", {}).get("core_satellite", []) or [] data_feed = raw.get("data", {}).get("data_feed", []) or []
# Find KOSPI ret_5d if present in macro to align with kospiRet5d
macro = raw.get("data", {}).get("macro", []) or []
kospi_ret_5d = 0.0
for m in macro:
if str(m.get("Ticker") or m.get("ticker")).strip() == "KOSPI":
kospi_ret_5d = float(m.get("Ret5D") or m.get("ret_5d") or 0.0)
break
scores = {} scores = {}
for row in core_satellite: for row in data_feed:
ticker = row.get("Ticker") ticker = row.get("Ticker") or row.get("ticker")
if not ticker: if not ticker:
continue continue
close = row.get("Close") or 0.0 res = calculate_distribution_risk(row, kospi_ret_5d)
ma20 = row.get("MA20") or close scores[ticker] = res
# Calculate distribution risk score: 0 to 100
score = min(100, max(0, int((close - ma20) / ma20 * 200)))
scores[ticker] = {
"distribution_risk_score": score,
"status": "HIGH" if score >= 50 else "NORMAL"
}
out_path = ROOT / args.out out_path = ROOT / args.out
out_path.parent.mkdir(parents=True, exist_ok=True) out_path.parent.mkdir(parents=True, exist_ok=True)