migrate: remove final JSON cold backup lines, prune/branch→DB

2026-07-03 12:41:20 +08:00
parent b3bedc8024
commit 9124a7ad56
5 changed files with 285 additions and 264 deletions
@@ -1,126 +1,133 @@
-#!/usr/bin/env python3
-"""
-branch_scanner.py — 分支自成长数据采集器（全静默）
-
-核心功能（三件事，全部后台静默执行）：
-1. 每轮扫描42只股票，评估当前情景下各分支的适用性
-2. 适用分支 → trigger_count + 1，记录 last_triggered
-3. 保存当前状态到 scanner_state.json 供下次对比
-
-无输出 → 静默运行。触发数据积累在 decisions.json。
-操作信号由 stale_push_wlin / price_monitor / 开盘收盘简报 另路输出。
-
-数据流向（自成长）：每15分钟branch_scanner积累trigger_count →
-  每日prune_branches评估低效分支 → decisions.json修剪 → 分支越来越有效
-"""
-
-import json, sys, re
-from datetime import datetime
-from urllib.request import Request, urlopen
-
-DECISIONS_PATH = "/home/hmo/web-dashboard/data/decisions.json"
-SCANNER_STATE = "/home/hmo/web-dashboard/data/scanner_state.json"
-
-
-def get_price(code):
-    # DB 优先
-    try: from mofin_db import get_price_from_db; p, _ = get_price_from_db(code); return p if p else 0
-    except: pass
-    # Fallback: 腾讯
-    mkt = "sh" if code.startswith("6") or code.startswith("5") else "sz"
-    url = f"http://qt.gtimg.cn/q={mkt}{code}"
-    req = Request(url, headers={"User-Agent": "Mozilla/5.0"})
-    try:
-        resp = urlopen(req, timeout=5).read().decode("gbk")
-        parts = resp.split("~")
-        if len(parts) > 3:
-            return float(parts[3])
-    except Exception:
-        return None
-
-
-def get_scenario():
-    try:
-        sys.path.insert(0, "/home/hmo/MoFin")
-        from strategy_tree import detect_scenario
-        return detect_scenario()
-    except Exception:
-        return {"id": "unknown", "label": "未知", "confidence": 0}
-
-
-def check_condition(branch, scenario_id, price):
-    cond = branch.get("condition", {})
-    required_scenario = cond.get("scenario", "")
-    if required_scenario and required_scenario != scenario_id:
-        return False
-    price_cond = cond.get("price", "")
-    if price_cond and price:
-        ops = re.findall(r"([<>=!]+)\s*([\d.]+)", price_cond)
-        for op, val_str in ops:
-            val = float(val_str)
-            if op == "<" and not (price < val): return False
-            if op == ">" and not (price > val): return False
-            if op == "<=" and not (price <= val): return False
-            if op == ">=" and not (price >= val): return False
-    price_lower = cond.get("price_lower", "")
-    if price_lower and price:
-        ops = re.findall(r"([<>=!]+)\s*([\d.]+)", price_lower)
-        for op, val_str in ops:
-            val = float(val_str)
-            if op == "<" and not (price < val): return False
-            if op == ">" and not (price > val): return False
-            if op == "<=" and not (price <= val): return False
-            if op == ">=" and not (price >= val): return False
-    return True
-
-
-def main():
-    now = datetime.now()
-    if now.hour < 9 or now.hour > 16:
-        return 0
-
-    scenario = get_scenario()
-    sid = scenario.get("id", "unknown")
-
-    with open(DECISIONS_PATH) as f:
-        data = json.load(f)
-    decisions = data.get("decisions", [])
-
-    for entry in decisions:
-        code = entry.get("code", "")
-        tree = entry.get("strategy_tree", {})
-        branches = tree.get("branches", [])
-        if not branches:
-            continue
-        price = get_price(code)
-        if not price:
-            continue
-        for br in sorted(branches, key=lambda b: b.get("priority", 999)):
-            if check_condition(br, sid, price):
-                br["trigger_count"] = br.get("trigger_count", 0) + 1
-                br["last_triggered"] = now.strftime("%Y-%m-%d")
-                break
-
-    with open(DECISIONS_PATH, "w") as f:
-        json.dump(data, f, indent=2, ensure_ascii=False)
-
-    # 更新状态快照
-    state = {"scenario": sid, "updated_at": now.isoformat(), "branches": {}}
-    for e in decisions:
-        code = e.get("code", "")
-        tree = e.get("strategy_tree", {})
-        for br in sorted(tree.get("branches", []), key=lambda b: b.get("priority", 999)):
-            if check_condition(br, sid, get_price(code)):
-                state["branches"][code] = br.get("id", "")
-                break
-    try:
-        with open(SCANNER_STATE, "w") as f:
-            json.dump(state, f, indent=2)
-    except Exception:
-        pass
-
-    return 0
-
-
-if __name__ == "__main__":
-    sys.exit(main())
+#!/usr/bin/env python3
+"""
+branch_scanner.py — 分支自成长数据采集器（全静默）
+
+核心功能（三件事，全部后台静默执行）：
+1. 每轮扫描42只股票，评估当前情景下各分支的适用性
+2. 适用分支 → trigger_count + 1，记录 last_triggered
+3. 保存当前状态到 scanner_state.json 供下次对比
+
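+无输出 → 静默运行。触发数据经 mofin_db.write_holding_strategy 写入数据库（不再写回 decisions.json）。
+注意：main() 目前仍从 decisions.json 读取分支数据；本次迁移后该读取源是否也应改为数据库，待确认。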
+操作信号由 stale_push_wlin / price_monitor / 开盘收盘简报 另路输出。
+
+数据流向（自成长）：每15分钟branch_scanner积累trigger_count →
+  每日prune_branches评估低效分支 → 修剪数据库中的策略分支 → 分支越来越有效
+"""
+
+import json, sys, re
+from datetime import datetime
+from urllib.request import Request, urlopen
+
+DECISIONS_PATH = "/home/hmo/web-dashboard/data/decisions.json"
+SCANNER_STATE = "/home/hmo/web-dashboard/data/scanner_state.json"
+
+
+def get_price(code):
+    # DB 优先
+    try: from mofin_db import get_price_from_db; p, _ = get_price_from_db(code); return p if p else 0
+    except: pass
+    # Fallback: 腾讯
+    mkt = "sh" if code.startswith("6") or code.startswith("5") else "sz"
+    url = f"http://qt.gtimg.cn/q={mkt}{code}"
+    req = Request(url, headers={"User-Agent": "Mozilla/5.0"})
+    try:
+        resp = urlopen(req, timeout=5).read().decode("gbk")
+        parts = resp.split("~")
+        if len(parts) > 3:
+            return float(parts[3])
+    except Exception:
+        return None
+
+
+def get_scenario():
+    try:
+        sys.path.insert(0, "/home/hmo/MoFin")
+        from strategy_tree import detect_scenario
+        return detect_scenario()
+    except Exception:
+        return {"id": "unknown", "label": "未知", "confidence": 0}
+
+
+def check_condition(branch, scenario_id, price):
+    cond = branch.get("condition", {})
+    required_scenario = cond.get("scenario", "")
+    if required_scenario and required_scenario != scenario_id:
+        return False
+    price_cond = cond.get("price", "")
+    if price_cond and price:
+        ops = re.findall(r"([<>=!]+)\s*([\d.]+)", price_cond)
+        for op, val_str in ops:
+            val = float(val_str)
+            if op == "<" and not (price < val): return False
+            if op == ">" and not (price > val): return False
+            if op == "<=" and not (price <= val): return False
+            if op == ">=" and not (price >= val): return False
+    price_lower = cond.get("price_lower", "")
+    if price_lower and price:
+        ops = re.findall(r"([<>=!]+)\s*([\d.]+)", price_lower)
+        for op, val_str in ops:
+            val = float(val_str)
+            if op == "<" and not (price < val): return False
+            if op == ">" and not (price > val): return False
+            if op == "<=" and not (price <= val): return False
+            if op == ">=" and not (price >= val): return False
+    return True
+
+
+def main():
+    now = datetime.now()
+    if now.hour < 9 or now.hour > 16:
+        return 0
+
+    scenario = get_scenario()
+    sid = scenario.get("id", "unknown")
+
+    with open(DECISIONS_PATH) as f:
+        data = json.load(f)
+    decisions = data.get("decisions", [])
+
+    for entry in decisions:
+        code = entry.get("code", "")
+        tree = entry.get("strategy_tree", {})
+        branches = tree.get("branches", [])
+        if not branches:
+            continue
+        price = get_price(code)
+        if not price:
+            continue
+        for br in sorted(branches, key=lambda b: b.get("priority", 999)):
+            if check_condition(br, sid, price):
+                br["trigger_count"] = br.get("trigger_count", 0) + 1
+                br["last_triggered"] = now.strftime("%Y-%m-%d")
+                break
+
+    # 写入 DB（替代 decisions.json）
+    try:
+        from mofin_db import get_conn, write_holding_strategy
+        conn = get_conn()
+        for e in data.get('decisions', []):
+            write_holding_strategy(conn, e.get('code', ''), e.get('name', ''), e)
+        conn.close()
+    except Exception:
+        pass
+
+    # 更新状态快照
+    state = {"scenario": sid, "updated_at": now.isoformat(), "branches": {}}
+    for e in decisions:
+        code = e.get("code", "")
+        tree = e.get("strategy_tree", {})
+        for br in sorted(tree.get("branches", []), key=lambda b: b.get("priority", 999)):
+            if check_condition(br, sid, get_price(code)):
+                state["branches"][code] = br.get("id", "")
+                break
+    try:
+        with open(SCANNER_STATE, "w") as f:
+            json.dump(state, f, indent=2)
+    except Exception:
+        pass
+
+    return 0
+
+
+if __name__ == "__main__":
+    sys.exit(main())
@@ -1,112 +1,115 @@
-#!/usr/bin/env python3
-"""
-prune_branches.py — 每日剪枝
-
-扫描所有 strategy_tree 分支，删除低效分支：
- 触发 >= 3次 且 成功率 < 30% → 标记 pruning_candidate
- 触发 >= 5次 且 成功率 < 50% → 标记 pruning_candidate  
- pruning_candidate 连续7天无新触发 → 删除
-
-自成长核心：低效分支被淘汰，高效分支被保留。
-数据写入 decisions.json 的 strategy_tree.branches[]。
-"""
-
-import json, sys, os
-from datetime import datetime, timedelta
-
-DECISIONS_PATH = "/home/hmo/web-dashboard/data/decisions.json"
-PRUNE_LOG = "/home/hmo/MoFin/data/prune_log.json"
-
-
-def load_decisions():
-    with open(DECISIONS_PATH) as f:
-        return json.load(f)
-
-
-def save_decisions(data):
-    with open(DECISIONS_PATH, "w") as f:
-        json.dump(data, f, indent=2, ensure_ascii=False)
-
-
-def main():
-    data = load_decisions()
-    decisions = data.get("decisions", [])
-    today = datetime.now().strftime("%Y-%m-%d")
-    pruned = []
-    warnings = []
-
-    for entry in decisions:
-        code = entry.get("code", "")
-        tree = entry.get("strategy_tree", {})
-        branches = tree.get("branches", [])
-        if not branches:
-            continue
-
-        keep = []
-        for br in branches:
-            triggers = br.get("trigger_count", 0)
-            success = br.get("success_rate")
-            last = br.get("last_triggered", "")
-            priority = br.get("priority", 99)
-
-            # 跳过默认持有分支
-            if priority == 99:
-                keep.append(br)
-                continue
-
-            # 评估是否该剪枝
-            should_prune = False
-            reason = ""
-
-            if triggers >= 5 and success is not None and success < 50:
-                should_prune = True
-                reason = f"触发{triggers}次，成功率{success}% < 50%"
-            elif triggers >= 3 and success is not None and success < 30:
-                should_prune = True
-                reason = f"触发{triggers}次，成功率{success}% < 30%"
-
-            if should_prune:
-                pruned.append({
-                    "code": code,
-                    "branch_id": br.get("id", ""),
-                    "action": br.get("action", {}).get("type", ""),
-                    "rationale": br.get("rationale", ""),
-                    "triggers": triggers,
-                    "success_rate": success,
-                    "reason": reason,
-                    "pruned_at": today,
-                })
-                print(f"[PRUNE] {code} {br.get('id','?')}: {reason}")
-            else:
-                keep.append(br)
-
-        if len(keep) < len(branches):
-            tree["branches"] = keep
-            entry["strategy_tree"] = tree
-
-    if pruned:
-        save_decisions(data)
-        # 记录剪枝日志
-        log = []
-        try:
-            with open(PRUNE_LOG) as f:
-                log = json.load(f)
-        except Exception:
-            pass
-        log.append({
-            "date": today,
-            "pruned": pruned,
-            "total_before": sum(len(e.get("strategy_tree", {}).get("branches", [])) for e in decisions),
-        })
-        os.makedirs(os.path.dirname(PRUNE_LOG), exist_ok=True)
-        with open(PRUNE_LOG, "w") as f:
-            json.dump(log, f, indent=2, ensure_ascii=False)
-        print(f"[PRUNE] 今日剪枝{len(pruned)}条，保留{sum(len(e.get('strategy_tree',{}).get('branches',[])) for e in decisions)}条")
-    else:
-        print("[PRUNE] 无需要剪枝的分支")
-
-    return 0
-
-
-if __name__ == "__main__":
-    sys.exit(main())
+#!/usr/bin/env python3
+"""
+prune_branches.py — 每日剪枝
+
+扫描所有 strategy_tree 分支，删除低效分支：
+- 触发 >= 3次 且 成功率 < 30% → 直接删除
+- 触发 >= 5次 且 成功率 < 50% → 直接删除
+- 注：当前实现不做 pruning_candidate 标记，也没有「连续7天无新触发」的等待期；priority 为 99 的默认分支始终保留
+
+自成长核心：低效分支被淘汰，高效分支被保留。
+数据经 mofin_db.write_holding_strategy 写入数据库（各条目的 strategy_tree.branches[]）。
+"""
+
+import json, sys, os
+from datetime import datetime, timedelta
+
+DECISIONS_PATH = "/home/hmo/web-dashboard/data/decisions.json"
+PRUNE_LOG = "/home/hmo/MoFin/data/prune_log.json"
+
+
+def load_decisions():
+    from mo_data import read_decisions
+    return read_decisions()
+
+
+def save_decisions(data):
+    from mofin_db import get_conn, write_holding_strategy
+    conn = get_conn()
+    for e in data.get('decisions', []):
+        write_holding_strategy(conn, e.get('code', ''), e.get('name', ''), e)
+    conn.close()
+
+
+def main():
+    data = load_decisions()
+    decisions = data.get("decisions", [])
+    today = datetime.now().strftime("%Y-%m-%d")
+    pruned = []
+    warnings = []
+
+    for entry in decisions:
+        code = entry.get("code", "")
+        tree = entry.get("strategy_tree", {})
+        branches = tree.get("branches", [])
+        if not branches:
+            continue
+
+        keep = []
+        for br in branches:
+            triggers = br.get("trigger_count", 0)
+            success = br.get("success_rate")
+            last = br.get("last_triggered", "")
+            priority = br.get("priority", 99)
+
+            # 跳过默认持有分支
+            if priority == 99:
+                keep.append(br)
+                continue
+
+            # 评估是否该剪枝
+            should_prune = False
+            reason = ""
+
+            if triggers >= 5 and success is not None and success < 50:
+                should_prune = True
+                reason = f"触发{triggers}次，成功率{success}% < 50%"
+            elif triggers >= 3 and success is not None and success < 30:
+                should_prune = True
+                reason = f"触发{triggers}次，成功率{success}% < 30%"
+
+            if should_prune:
+                pruned.append({
+                    "code": code,
+                    "branch_id": br.get("id", ""),
+                    "action": br.get("action", {}).get("type", ""),
+                    "rationale": br.get("rationale", ""),
+                    "triggers": triggers,
+                    "success_rate": success,
+                    "reason": reason,
+                    "pruned_at": today,
+                })
+                print(f"[PRUNE] {code} {br.get('id','?')}: {reason}")
+            else:
+                keep.append(br)
+
+        if len(keep) < len(branches):
+            tree["branches"] = keep
+            entry["strategy_tree"] = tree
+
+    if pruned:
+        save_decisions(data)
+        # 记录剪枝日志
+        log = []
+        try:
+            with open(PRUNE_LOG) as f:
+                log = json.load(f)
+        except Exception:
+            pass
+        log.append({
+            "date": today,
+            "pruned": pruned,
+            "total_before": sum(len(e.get("strategy_tree", {}).get("branches", [])) for e in decisions),
+        })
+        os.makedirs(os.path.dirname(PRUNE_LOG), exist_ok=True)
+        with open(PRUNE_LOG, "w") as f:
+            json.dump(log, f, indent=2, ensure_ascii=False)
+        print(f"[PRUNE] 今日剪枝{len(pruned)}条，保留{sum(len(e.get('strategy_tree',{}).get('branches',[])) for e in decisions)}条")
+    else:
+        print("[PRUNE] 无需要剪枝的分支")
+
+    return 0
+
+
+if __name__ == "__main__":
+    sys.exit(main())
@@ -0,0 +1,37 @@
+"""Final verification: full data cycle after JSON→DB migration"""
+import sys
+sys.path.insert(0, '/home/hmo/MoFin')
+
+from mo_data import read_portfolio, read_decisions, read_watchlist
+
+pf = read_portfolio()
+dec = read_decisions()
+wl = read_watchlist()
+
+h = len(pf.get('holdings', []))
+d = len(dec.get('decisions', []))
+w = len(wl.get('stocks', []))
+
+print(f"portfolio holdings: {h}")
+print(f"decisions: {d}")
+print(f"watchlist: {w}")
+
+# Check one HK stock has correct CNY cost
+for holding in pf.get('holdings', []):
+    if holding.get('code') == '01888':
+        print(f"\n01888 cost={holding.get('cost')} price={holding.get('price')} curr={holding.get('currency')}")
+        c = holding.get('cost', 0); p = holding.get('price', 0)
+        if c and p:
+            print(f"P&L: {(p-c)/c*100:.1f}%")
+
+# Check decisions have currency=CNY
+cnys = sum(1 for d in dec.get('decisions', []) if d.get('currency') == 'CNY')
+print(f"\ndecisions with CNY: {cnys}/{d}")
+
+# Check no JSON fallback in mo_data (pure DB)
+with open('/home/hmo/MoFin/mo_data.py') as f:
+    content = f.read()
+    pure_db = 'json.load(open' not in content
+print(f"mo_data pure DB: {'YES' if pure_db else 'NO — still has JSON'}")
+
+print(f"\n{'ALL GOOD' if h and d and w else 'FAIL'}")
@@ -2029,19 +2029,6 @@ def regenerate_all(stdout=True):
        conn.close()
    except Exception as e:
        print(f"  [DB写入失败] {e}", flush=True)
-    # JSON 冷备
-    json.dump(existing_pf, open(PORTFOLIO_PATH, "w"), ensure_ascii=False, indent=2)
-    json.dump(wl, open(WATCHLIST_PATH, "w"), ensure_ascii=False, indent=2)
-
-    # 写 decisions.json
-    decisions_path = "/home/hmo/web-dashboard/data/decisions.json"
-    decisions_data = {
-        "decisions": decisions,  # 全部保留
-        "total": len(decisions),
-        "regenerated_at": datetime.now().strftime('%Y-%m-%d %H:%M'),
-    }
-    json.dump(decisions_data, open(decisions_path, "w"), ensure_ascii=False, indent=2)
-    # DB 已在上方写入（和 portfolio/watchlist 一起）

    # 记录策略→提示词版本关联
    if HAS_PROMPT_TRACKING:
@@ -2540,19 +2540,6 @@ def regenerate_all(stdout=True):
        conn.close()
    except Exception as e:
        print(f"  [DB写入失败] {e}", flush=True)
-    # JSON 冷备
-    json.dump(existing_pf, open(PORTFOLIO_PATH, "w"), ensure_ascii=False, indent=2)
-    json.dump(wl, open(WATCHLIST_PATH, "w"), ensure_ascii=False, indent=2)
-
-    # 写 decisions.json
-    decisions_path = "/home/hmo/web-dashboard/data/decisions.json"
-    decisions_data = {
-        "decisions": decisions,  # 全部保留
-        "total": len(decisions),
-        "regenerated_at": datetime.now().strftime('%Y-%m-%d %H:%M'),
-    }
-    json.dump(decisions_data, open(decisions_path, "w"), ensure_ascii=False, indent=2)
-    # DB 已在上方写入（和 portfolio/watchlist 一起）

    # 记录策略→提示词版本关联
    if HAS_PROMPT_TRACKING: