test_app_utils.py 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277
  1. import math
  2. import unittest
  3. import pandas as pd
  4. from app_utils import (
  5. apply_defect_filters,
  6. build_html_report,
  7. build_ml_factor_insights,
  8. build_diagnostic_dashboard,
  9. classify_panel_zone,
  10. calculate_kpis,
  11. calculate_spc_metrics,
  12. generate_industry_diagnosis,
  13. normalize_defect_schema,
  14. )
  15. class AppUtilsTest(unittest.TestCase):
  16. def setUp(self):
  17. self.df = pd.DataFrame(
  18. {
  19. "defect_id": ["D1", "D2", "D3", "D4"],
  20. "panel_id": ["P1", "P2", "P2", "P3"],
  21. "batch_id": ["B1", "B1", "B2", "B2"],
  22. "equipment_id": ["E1", "E1", "E2", "E2"],
  23. "seat_id": ["S1", "S2", "S1", "S2"],
  24. "timestamp": pd.to_datetime(
  25. [
  26. "2026-04-01 00:00:00",
  27. "2026-04-01 23:59:59",
  28. "2026-04-02 12:00:00",
  29. "2026-04-03 00:00:01",
  30. ]
  31. ),
  32. "defect_type": ["划痕", "亮点", "划痕", "暗点"],
  33. "severity": ["严重", "轻微", "中等", "严重"],
  34. "shift": ["白班", "夜班", "白班", "白班"],
  35. "day": ["2026-04-01", "2026-04-01", "2026-04-02", "2026-04-03"],
  36. }
  37. )
  38. def test_date_filter_includes_full_end_date(self):
  39. filtered = apply_defect_filters(
  40. self.df,
  41. start_date=pd.Timestamp("2026-04-01"),
  42. end_date=pd.Timestamp("2026-04-01"),
  43. selected_types=["划痕", "亮点", "暗点"],
  44. selected_batches=["B1", "B2"],
  45. selected_equipment=["E1", "E2"],
  46. selected_seats=["S1", "S2"],
  47. selected_shift="全部",
  48. selected_severity="全部",
  49. )
  50. self.assertEqual(["D1", "D2"], filtered["defect_id"].tolist())
  51. def test_kpis_use_same_filter_scope_for_total_panels(self):
  52. filtered = apply_defect_filters(
  53. self.df,
  54. start_date=pd.Timestamp("2026-04-01"),
  55. end_date=pd.Timestamp("2026-04-02"),
  56. selected_types=["划痕"],
  57. selected_batches=["B1", "B2"],
  58. selected_equipment=["E1", "E2"],
  59. selected_seats=["S1"],
  60. selected_shift="全部",
  61. selected_severity="全部",
  62. )
  63. kpis = calculate_kpis(self.df, filtered)
  64. self.assertEqual(2, kpis["total_panels_inspected"])
  65. self.assertEqual(2, kpis["defective_panels"])
  66. self.assertEqual(0.0, kpis["yield_rate"])
  67. def test_spc_metrics_clamp_estimated_rate_to_valid_probability(self):
  68. metrics = calculate_spc_metrics(self.df)
  69. self.assertTrue(math.isfinite(metrics["p_bar"]))
  70. self.assertTrue(math.isfinite(metrics["ucl"]))
  71. self.assertTrue(math.isfinite(metrics["lcl"]))
  72. self.assertLessEqual(metrics["daily"]["defect_rate"].max(), 1.0)
  73. def test_diagnostic_dashboard_ranks_root_cause_candidates(self):
  74. dashboard = build_diagnostic_dashboard(self.df)
  75. self.assertEqual("严重", dashboard["severity_level"])
  76. self.assertEqual("E1 / S1", dashboard["root_causes"].iloc[0]["根因候选"])
  77. self.assertEqual("划痕", dashboard["top_defect_type"])
  78. self.assertIn("优先排查", dashboard["primary_recommendation"])
  79. def test_diagnostic_dashboard_reports_baseline_lift(self):
  80. rows = []
  81. for i in range(10):
  82. rows.append(
  83. {
  84. "defect_id": f"D{i}",
  85. "panel_id": f"P{i}",
  86. "batch_id": "B1",
  87. "equipment_id": "E1",
  88. "seat_id": "S-hot" if i < 8 else "S-cold",
  89. "timestamp": pd.Timestamp("2026-04-01"),
  90. "defect_type": "气泡",
  91. "severity": "严重" if i < 2 else "轻微",
  92. "shift": "白班",
  93. "day": "2026-04-01",
  94. }
  95. )
  96. df = pd.DataFrame(rows)
  97. dashboard = build_diagnostic_dashboard(df)
  98. top = dashboard["root_causes"].iloc[0]
  99. self.assertEqual("E1 / S-hot", top["根因候选"])
  100. self.assertGreater(top["异常倍数"], 1.0)
  101. def test_classify_panel_zone_uses_3c_panel_regions(self):
  102. zones = classify_panel_zone(
  103. pd.DataFrame(
  104. {
  105. "x_mm": [2.0, 77.5, 150.0, 80.0],
  106. "y_mm": [335.0, 255.0, 170.0, 20.0],
  107. "panel_width_mm": [155.0] * 4,
  108. "panel_height_mm": [340.0] * 4,
  109. }
  110. )
  111. )
  112. self.assertIn("角落区", zones.iloc[0])
  113. self.assertIn("FPC/绑定区", zones.iloc[1])
  114. self.assertIn("右边缘区", zones.iloc[2])
  115. self.assertIn("下边缘区", zones.iloc[3])
  116. def test_industry_diagnosis_generates_panel_sop_recommendation(self):
  117. rows = []
  118. for i in range(12):
  119. rows.append(
  120. {
  121. "defect_id": f"D{i}",
  122. "panel_id": f"P{i}",
  123. "batch_id": "B1",
  124. "equipment_id": "LAM-A01",
  125. "seat_id": "R2C3",
  126. "timestamp": pd.Timestamp("2026-04-01"),
  127. "defect_type": "气泡",
  128. "severity": "严重" if i < 4 else "中等",
  129. "x_mm": 5.0 + i * 0.3,
  130. "y_mm": 250.0,
  131. "panel_width_mm": 155.0,
  132. "panel_height_mm": 340.0,
  133. "shift": "白班",
  134. "day": "2026-04-01",
  135. }
  136. )
  137. df = pd.DataFrame(rows)
  138. dashboard = build_diagnostic_dashboard(df)
  139. diagnosis = generate_industry_diagnosis(df, dashboard)
  140. self.assertIn("边缘", diagnosis["headline"])
  141. self.assertIn("气泡", diagnosis["headline"])
  142. self.assertTrue(any("贴合" in item for item in diagnosis["recommendations"]))
  143. self.assertTrue(any("跨面板重复" in pattern for pattern in diagnosis["patterns"]))
  144. def test_normalize_defect_schema_backfills_industry_fields(self):
  145. normalized = normalize_defect_schema(self.df)
  146. self.assertIn("defect_geometry_type", normalized.columns)
  147. self.assertIn("lam_equipment_id", normalized.columns)
  148. self.assertIn("clean_equipment_id", normalized.columns)
  149. self.assertEqual(["point"] * len(normalized), normalized["defect_geometry_type"].tolist())
  150. self.assertEqual(normalized["equipment_id"].tolist(), normalized["lam_equipment_id"].tolist())
  151. self.assertEqual(normalized["seat_id"].tolist(), normalized["lam_seat_id"].tolist())
  152. self.assertTrue((normalized["area_mm2"] >= 0).all())
  153. def test_diagnostic_dashboard_includes_extended_root_causes(self):
  154. rows = []
  155. for i in range(12):
  156. rows.append(
  157. {
  158. "defect_id": f"D{i}",
  159. "panel_id": f"P{i}",
  160. "batch_id": "B1",
  161. "equipment_id": "LAM-A01",
  162. "seat_id": f"R{i % 4 + 1}C1",
  163. "inspection_station": "AOI-1",
  164. "timestamp": pd.Timestamp("2026-04-01"),
  165. "defect_type": "划痕",
  166. "severity": "严重" if i < 4 else "轻微",
  167. "x_mm": 10 + i,
  168. "y_mm": 20 + i,
  169. "panel_width_mm": 155.0,
  170. "panel_height_mm": 340.0,
  171. "hour": 8,
  172. "shift": "白班",
  173. "day": "2026-04-01",
  174. "lam_fixture_id": "FIX-HOT" if i < 9 else "FIX-OK",
  175. "lam_nozzle_id": "NZ-01" if i < 9 else "NZ-02",
  176. "material_lot_oca": "OCA-HOT" if i < 9 else "OCA-OK",
  177. }
  178. )
  179. df = normalize_defect_schema(pd.DataFrame(rows))
  180. dashboard = build_diagnostic_dashboard(df)
  181. extended = dashboard["extended_root_causes"]
  182. self.assertFalse(extended.empty)
  183. self.assertEqual("lam_fixture_id", extended.iloc[0]["维度"])
  184. self.assertEqual("FIX-HOT", extended.iloc[0]["候选值"])
  185. self.assertGreater(extended.iloc[0]["异常倍数"], 1.0)
  186. def test_ml_factor_insights_include_model_audit_outputs(self):
  187. rows = []
  188. for i in range(40):
  189. hot = i < 24
  190. rows.append(
  191. {
  192. "defect_id": f"D{i}",
  193. "panel_id": f"P{i}",
  194. "batch_id": "B1",
  195. "equipment_id": "LAM-A01" if hot else "LAM-B01",
  196. "seat_id": "R1C1" if hot else "R2C2",
  197. "inspection_station": "AOI-1",
  198. "timestamp": pd.Timestamp("2026-04-01 08:00:00"),
  199. "defect_type": "气泡" if hot else "划痕",
  200. "severity": "严重" if i % 5 == 0 else "轻微",
  201. "x_mm": 10.0 + i,
  202. "y_mm": 20.0,
  203. "panel_width_mm": 155.0,
  204. "panel_height_mm": 340.0,
  205. "hour": 8,
  206. "shift": "白班",
  207. "day": "2026-04-01",
  208. "lam_fixture_id": "FIX-HOT" if hot else "FIX-OK",
  209. "material_lot_oca": "OCA-HOT" if hot else "OCA-OK",
  210. }
  211. )
  212. df = normalize_defect_schema(pd.DataFrame(rows))
  213. insights = build_ml_factor_insights(df, target_defect_type="气泡", model_name="random_forest", top_n=5)
  214. self.assertIsNone(insights["error"])
  215. self.assertEqual("气泡", insights["target_defect_type"])
  216. self.assertFalse(insights["key_factors"].empty)
  217. self.assertIn("validation_auc", insights["validation_metrics"])
  218. self.assertGreater(len(insights["feature_importance"]), 0)
  219. def test_build_html_report_creates_self_contained_safe_webpage(self):
  220. html = build_html_report(
  221. generated_at="2026-05-18 10:00:00",
  222. date_range_text="2026-04-01 ~ 2026-04-30",
  223. view_mode="工程师",
  224. defect_count=12,
  225. panel_count=8,
  226. kpis={
  227. "total_panels_inspected": 8,
  228. "defective_panels": 3,
  229. "yield_rate": 62.5,
  230. "critical_defects": 2,
  231. },
  232. type_counts=pd.Series({"气泡<script>": 7, "划痕": 5}),
  233. equipment_counts=pd.Series({"LAM-A01": 9}),
  234. seat_top=pd.Series({"R1C1": 4}),
  235. trend_summary="缺陷数趋势: 上升",
  236. anomaly_rows=[{"equipment": "LAM-A01", "seat": "R1C1", "count": 4}],
  237. recommendations=["重点关注气泡"],
  238. )
  239. self.assertIn("<!doctype html>", html.lower())
  240. self.assertIn("缺陷集中性分析综合报告", html)
  241. self.assertIn("气泡&lt;script&gt;", html)
  242. self.assertNotIn("气泡<script>", html)
  243. if __name__ == "__main__":
  244. unittest.main()