test_app_utils.py 9.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250
  1. import math
  2. import unittest
  3. import pandas as pd
  4. from app_utils import (
  5. apply_defect_filters,
  6. build_ml_factor_insights,
  7. build_diagnostic_dashboard,
  8. classify_panel_zone,
  9. calculate_kpis,
  10. calculate_spc_metrics,
  11. generate_industry_diagnosis,
  12. normalize_defect_schema,
  13. )
  14. class AppUtilsTest(unittest.TestCase):
  15. def setUp(self):
  16. self.df = pd.DataFrame(
  17. {
  18. "defect_id": ["D1", "D2", "D3", "D4"],
  19. "panel_id": ["P1", "P2", "P2", "P3"],
  20. "batch_id": ["B1", "B1", "B2", "B2"],
  21. "equipment_id": ["E1", "E1", "E2", "E2"],
  22. "seat_id": ["S1", "S2", "S1", "S2"],
  23. "timestamp": pd.to_datetime(
  24. [
  25. "2026-04-01 00:00:00",
  26. "2026-04-01 23:59:59",
  27. "2026-04-02 12:00:00",
  28. "2026-04-03 00:00:01",
  29. ]
  30. ),
  31. "defect_type": ["划痕", "亮点", "划痕", "暗点"],
  32. "severity": ["严重", "轻微", "中等", "严重"],
  33. "shift": ["白班", "夜班", "白班", "白班"],
  34. "day": ["2026-04-01", "2026-04-01", "2026-04-02", "2026-04-03"],
  35. }
  36. )
  37. def test_date_filter_includes_full_end_date(self):
  38. filtered = apply_defect_filters(
  39. self.df,
  40. start_date=pd.Timestamp("2026-04-01"),
  41. end_date=pd.Timestamp("2026-04-01"),
  42. selected_types=["划痕", "亮点", "暗点"],
  43. selected_batches=["B1", "B2"],
  44. selected_equipment=["E1", "E2"],
  45. selected_seats=["S1", "S2"],
  46. selected_shift="全部",
  47. selected_severity="全部",
  48. )
  49. self.assertEqual(["D1", "D2"], filtered["defect_id"].tolist())
  50. def test_kpis_use_same_filter_scope_for_total_panels(self):
  51. filtered = apply_defect_filters(
  52. self.df,
  53. start_date=pd.Timestamp("2026-04-01"),
  54. end_date=pd.Timestamp("2026-04-02"),
  55. selected_types=["划痕"],
  56. selected_batches=["B1", "B2"],
  57. selected_equipment=["E1", "E2"],
  58. selected_seats=["S1"],
  59. selected_shift="全部",
  60. selected_severity="全部",
  61. )
  62. kpis = calculate_kpis(self.df, filtered)
  63. self.assertEqual(2, kpis["total_panels_inspected"])
  64. self.assertEqual(2, kpis["defective_panels"])
  65. self.assertEqual(0.0, kpis["yield_rate"])
  66. def test_spc_metrics_clamp_estimated_rate_to_valid_probability(self):
  67. metrics = calculate_spc_metrics(self.df)
  68. self.assertTrue(math.isfinite(metrics["p_bar"]))
  69. self.assertTrue(math.isfinite(metrics["ucl"]))
  70. self.assertTrue(math.isfinite(metrics["lcl"]))
  71. self.assertLessEqual(metrics["daily"]["defect_rate"].max(), 1.0)
  72. def test_diagnostic_dashboard_ranks_root_cause_candidates(self):
  73. dashboard = build_diagnostic_dashboard(self.df)
  74. self.assertEqual("严重", dashboard["severity_level"])
  75. self.assertEqual("E1 / S1", dashboard["root_causes"].iloc[0]["根因候选"])
  76. self.assertEqual("划痕", dashboard["top_defect_type"])
  77. self.assertIn("优先排查", dashboard["primary_recommendation"])
  78. def test_diagnostic_dashboard_reports_baseline_lift(self):
  79. rows = []
  80. for i in range(10):
  81. rows.append(
  82. {
  83. "defect_id": f"D{i}",
  84. "panel_id": f"P{i}",
  85. "batch_id": "B1",
  86. "equipment_id": "E1",
  87. "seat_id": "S-hot" if i < 8 else "S-cold",
  88. "timestamp": pd.Timestamp("2026-04-01"),
  89. "defect_type": "气泡",
  90. "severity": "严重" if i < 2 else "轻微",
  91. "shift": "白班",
  92. "day": "2026-04-01",
  93. }
  94. )
  95. df = pd.DataFrame(rows)
  96. dashboard = build_diagnostic_dashboard(df)
  97. top = dashboard["root_causes"].iloc[0]
  98. self.assertEqual("E1 / S-hot", top["根因候选"])
  99. self.assertGreater(top["异常倍数"], 1.0)
  100. def test_classify_panel_zone_uses_3c_panel_regions(self):
  101. zones = classify_panel_zone(
  102. pd.DataFrame(
  103. {
  104. "x_mm": [2.0, 77.5, 150.0, 80.0],
  105. "y_mm": [335.0, 255.0, 170.0, 20.0],
  106. "panel_width_mm": [155.0] * 4,
  107. "panel_height_mm": [340.0] * 4,
  108. }
  109. )
  110. )
  111. self.assertIn("角落区", zones.iloc[0])
  112. self.assertIn("FPC/绑定区", zones.iloc[1])
  113. self.assertIn("右边缘区", zones.iloc[2])
  114. self.assertIn("下边缘区", zones.iloc[3])
  115. def test_industry_diagnosis_generates_panel_sop_recommendation(self):
  116. rows = []
  117. for i in range(12):
  118. rows.append(
  119. {
  120. "defect_id": f"D{i}",
  121. "panel_id": f"P{i}",
  122. "batch_id": "B1",
  123. "equipment_id": "LAM-A01",
  124. "seat_id": "R2C3",
  125. "timestamp": pd.Timestamp("2026-04-01"),
  126. "defect_type": "气泡",
  127. "severity": "严重" if i < 4 else "中等",
  128. "x_mm": 5.0 + i * 0.3,
  129. "y_mm": 250.0,
  130. "panel_width_mm": 155.0,
  131. "panel_height_mm": 340.0,
  132. "shift": "白班",
  133. "day": "2026-04-01",
  134. }
  135. )
  136. df = pd.DataFrame(rows)
  137. dashboard = build_diagnostic_dashboard(df)
  138. diagnosis = generate_industry_diagnosis(df, dashboard)
  139. self.assertIn("边缘", diagnosis["headline"])
  140. self.assertIn("气泡", diagnosis["headline"])
  141. self.assertTrue(any("贴合" in item for item in diagnosis["recommendations"]))
  142. self.assertTrue(any("跨面板重复" in pattern for pattern in diagnosis["patterns"]))
  143. def test_normalize_defect_schema_backfills_industry_fields(self):
  144. normalized = normalize_defect_schema(self.df)
  145. self.assertIn("defect_geometry_type", normalized.columns)
  146. self.assertIn("lam_equipment_id", normalized.columns)
  147. self.assertIn("clean_equipment_id", normalized.columns)
  148. self.assertEqual(["point"] * len(normalized), normalized["defect_geometry_type"].tolist())
  149. self.assertEqual(normalized["equipment_id"].tolist(), normalized["lam_equipment_id"].tolist())
  150. self.assertEqual(normalized["seat_id"].tolist(), normalized["lam_seat_id"].tolist())
  151. self.assertTrue((normalized["area_mm2"] >= 0).all())
  152. def test_diagnostic_dashboard_includes_extended_root_causes(self):
  153. rows = []
  154. for i in range(12):
  155. rows.append(
  156. {
  157. "defect_id": f"D{i}",
  158. "panel_id": f"P{i}",
  159. "batch_id": "B1",
  160. "equipment_id": "LAM-A01",
  161. "seat_id": f"R{i % 4 + 1}C1",
  162. "inspection_station": "AOI-1",
  163. "timestamp": pd.Timestamp("2026-04-01"),
  164. "defect_type": "划痕",
  165. "severity": "严重" if i < 4 else "轻微",
  166. "x_mm": 10 + i,
  167. "y_mm": 20 + i,
  168. "panel_width_mm": 155.0,
  169. "panel_height_mm": 340.0,
  170. "hour": 8,
  171. "shift": "白班",
  172. "day": "2026-04-01",
  173. "lam_fixture_id": "FIX-HOT" if i < 9 else "FIX-OK",
  174. "lam_nozzle_id": "NZ-01" if i < 9 else "NZ-02",
  175. "material_lot_oca": "OCA-HOT" if i < 9 else "OCA-OK",
  176. }
  177. )
  178. df = normalize_defect_schema(pd.DataFrame(rows))
  179. dashboard = build_diagnostic_dashboard(df)
  180. extended = dashboard["extended_root_causes"]
  181. self.assertFalse(extended.empty)
  182. self.assertEqual("lam_fixture_id", extended.iloc[0]["维度"])
  183. self.assertEqual("FIX-HOT", extended.iloc[0]["候选值"])
  184. self.assertGreater(extended.iloc[0]["异常倍数"], 1.0)
  185. def test_ml_factor_insights_include_model_audit_outputs(self):
  186. rows = []
  187. for i in range(40):
  188. hot = i < 24
  189. rows.append(
  190. {
  191. "defect_id": f"D{i}",
  192. "panel_id": f"P{i}",
  193. "batch_id": "B1",
  194. "equipment_id": "LAM-A01" if hot else "LAM-B01",
  195. "seat_id": "R1C1" if hot else "R2C2",
  196. "inspection_station": "AOI-1",
  197. "timestamp": pd.Timestamp("2026-04-01 08:00:00"),
  198. "defect_type": "气泡" if hot else "划痕",
  199. "severity": "严重" if i % 5 == 0 else "轻微",
  200. "x_mm": 10.0 + i,
  201. "y_mm": 20.0,
  202. "panel_width_mm": 155.0,
  203. "panel_height_mm": 340.0,
  204. "hour": 8,
  205. "shift": "白班",
  206. "day": "2026-04-01",
  207. "lam_fixture_id": "FIX-HOT" if hot else "FIX-OK",
  208. "material_lot_oca": "OCA-HOT" if hot else "OCA-OK",
  209. }
  210. )
  211. df = normalize_defect_schema(pd.DataFrame(rows))
  212. insights = build_ml_factor_insights(df, target_defect_type="气泡", model_name="random_forest", top_n=5)
  213. self.assertIsNone(insights["error"])
  214. self.assertEqual("气泡", insights["target_defect_type"])
  215. self.assertFalse(insights["key_factors"].empty)
  216. self.assertIn("validation_auc", insights["validation_metrics"])
  217. self.assertGreater(len(insights["feature_importance"]), 0)
  218. if __name__ == "__main__":
  219. unittest.main()