case_embed_store.py 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348
  1. """
  2. 典型案例库-固定结构:
  3. {
  4. "case_id": "string",
  5. "expense_type": "PERSONAL | BUSINESS",
  6. "category": "string",
  7. "subcategory": "string",
  8. "invoice_item": "string",
  9. "seller_profile": "string",
  10. "decision": "PERSONAL | BUSINESS",
  11. "risk_level": "LOW | MEDIUM | HIGH",
  12. "decision_reason": ["string"],
  13. "embedding_text": "string",
  14. "source": "string"
  15. }
  16. """
  17. case_embed = [
  18. {
  19. "case_id": "CASE-PER-EDU-001",
  20. "expense_type": "PERSONAL",
  21. "category": "教育",
  22. "subcategory": "学费",
  23. "invoice_item": "某大学学费",
  24. "seller_profile": "高等教育机构",
  25. "decision": "PERSONAL",
  26. "risk_level": "HIGH",
  27. "decision_reason": [
  28. "费用为个人学历教育学费",
  29. "与企业主营业务无直接关联"
  30. ],
  31. "embedding_text": "该发票内容为大学学费,属于个人学历教育支出,主要用于个人受教育目的,与企业日常经营活动无直接关系,因此判定为个人消费。",
  32. "source": "人工审核确认"
  33. }
  34. , {
  35. "case_id": "CASE-PER-EDU-002",
  36. "expense_type": "PERSONAL",
  37. "category": "教育",
  38. "subcategory": "兴趣培训",
  39. "invoice_item": "少儿美术兴趣班培训费",
  40. "seller_profile": "教育培训机构",
  41. "decision": "PERSONAL",
  42. "risk_level": "HIGH",
  43. "decision_reason": [
  44. "兴趣类培训不属于企业经营支出",
  45. "培训对象为个人或家庭成员"
  46. ],
  47. "embedding_text": "发票项目为兴趣班培训费用,例如美术、音乐等兴趣课程,主要用于个人或家庭教育需求,不属于企业经营活动支出,通常应判定为个人消费。",
  48. "source": "人工审核确认"
  49. },
  50. {
  51. "case_id": "CASE-PER-CLOTH-003",
  52. "expense_type": "PERSONAL",
  53. "category": "个人消费",
  54. "subcategory": "服饰",
  55. "invoice_item": "服装购买费用",
  56. "seller_profile": "服装零售商",
  57. "decision": "PERSONAL",
  58. "risk_level": "HIGH",
  59. "decision_reason": [
  60. "服装为个人日常穿着用品",
  61. "非企业统一采购工装"
  62. ],
  63. "embedding_text": "该发票为服装购买费用,商品为个人日常穿着服饰,并非企业统一采购的工装或制服,与企业经营活动无直接关系,判定为个人消费。",
  64. "source": "人工审核确认"
  65. }
  66. ,
  67. {
  68. "case_id": "CASE-PER-COS-004",
  69. "expense_type": "PERSONAL",
  70. "category": "个人消费",
  71. "subcategory": "化妆品",
  72. "invoice_item": "护肤品及化妆品购买",
  73. "seller_profile": "化妆品零售商",
  74. "decision": "PERSONAL",
  75. "risk_level": "HIGH",
  76. "decision_reason": [
  77. "化妆品为个人形象消费",
  78. "无业务用途说明"
  79. ],
  80. "embedding_text": "发票内容为化妆品、护肤品等个人形象相关消费,主要满足个人生活和形象管理需求,未体现企业业务用途,应判定为个人消费。",
  81. "source": "人工审核确认"
  82. }
  83. , {
  84. "case_id": "CASE-PER-JEWEL-005",
  85. "expense_type": "PERSONAL",
  86. "category": "个人消费",
  87. "subcategory": "首饰",
  88. "invoice_item": "黄金首饰购买",
  89. "seller_profile": "珠宝首饰商户",
  90. "decision": "PERSONAL",
  91. "risk_level": "HIGH",
  92. "decision_reason": [
  93. "首饰为个人佩戴用品",
  94. "不属于企业资产或业务礼品"
  95. ],
  96. "embedding_text": "该发票为首饰、珠宝类购买费用,商品具有明显的个人装饰属性,与企业经营活动无直接关联,通常判定为个人消费。",
  97. "source": "人工审核确认"
  98. },
  99. {
  100. "case_id": "CASE-PER-MED-006",
  101. "expense_type": "PERSONAL",
  102. "category": "医疗健康",
  103. "subcategory": "体检",
  104. "invoice_item": "个人体检服务费",
  105. "seller_profile": "医疗体检机构",
  106. "decision": "PERSONAL",
  107. "risk_level": "MEDIUM",
  108. "decision_reason": [
  109. "体检对象为个人",
  110. "非企业统一员工体检"
  111. ],
  112. "embedding_text": "发票项目为个人体检服务费用,用于个人健康检查,未标注为企业统一员工体检福利,因此判定为个人消费。",
  113. "source": "人工审核确认"
  114. }
  115. , {
  116. "case_id": "CASE-PER-HEALTH-007",
  117. "expense_type": "PERSONAL",
  118. "category": "医疗健康",
  119. "subcategory": "保健品",
  120. "invoice_item": "营养保健品购买",
  121. "seller_profile": "保健品销售商",
  122. "decision": "PERSONAL",
  123. "risk_level": "HIGH",
  124. "decision_reason": [
  125. "保健品用于个人健康调养",
  126. "非企业统一福利"
  127. ],
  128. "embedding_text": "该发票为营养品、保健品等健康相关消费,主要用于个人身体调养和保健需求,与企业经营活动无直接关系,应判定为个人消费。",
  129. "source": "人工审核确认"
  130. }
  131. , {
  132. "case_id": "CASE-PER-ENT-008",
  133. "expense_type": "PERSONAL",
  134. "category": "文体娱乐",
  135. "subcategory": "电影",
  136. "invoice_item": "电影票费用",
  137. "seller_profile": "电影院",
  138. "decision": "PERSONAL",
  139. "risk_level": "HIGH",
  140. "decision_reason": [
  141. "电影票为个人娱乐消费",
  142. "无员工活动或团建说明"
  143. ],
  144. "embedding_text": "发票内容为电影票或观影服务费用,属于典型个人娱乐消费,与企业经营活动无直接关系,通常判定为个人消费。",
  145. "source": "人工审核确认"
  146. }
  147. , {
  148. "case_id": "CASE-PER-KTV-009",
  149. "expense_type": "PERSONAL",
  150. "category": "文体娱乐",
  151. "subcategory": "KTV",
  152. "invoice_item": "KTV 包厢消费",
  153. "seller_profile": "娱乐服务场所",
  154. "decision": "PERSONAL",
  155. "risk_level": "HIGH",
  156. "decision_reason": [
  157. "KTV 为娱乐性质消费",
  158. "未标注为客户接待或团建"
  159. ],
  160. "embedding_text": "该发票为 KTV 包厢或娱乐消费费用,具有明显个人娱乐属性,未体现业务接待或公司活动背景,应判定为个人消费。",
  161. "source": "人工审核确认"
  162. }
  163. , {
  164. "case_id": "CASE-PER-FIT-010",
  165. "expense_type": "PERSONAL",
  166. "category": "文体娱乐",
  167. "subcategory": "健身",
  168. "invoice_item": "健身房年卡会员费",
  169. "seller_profile": "健身服务机构",
  170. "decision": "PERSONAL",
  171. "risk_level": "HIGH",
  172. "decision_reason": [
  173. "健身卡为个人健身用途",
  174. "非企业统一员工福利"
  175. ],
  176. "embedding_text": "发票项目为健身房会员年卡或健身卡费用,主要用于个人身体锻炼和健康管理,通常不属于企业经营支出,应判定为个人消费。",
  177. "source": "人工审核确认"
  178. }
  179. , {
  180. "case_id": "CASE-PER-TRAVEL-011",
  181. "expense_type": "PERSONAL",
  182. "category": "出行旅游",
  183. "subcategory": "私人旅游",
  184. "invoice_item": "景区门票及旅游服务费",
  185. "seller_profile": "旅游服务商",
  186. "decision": "PERSONAL",
  187. "risk_level": "HIGH",
  188. "decision_reason": [
  189. "旅游行为为私人出行",
  190. "无商务出差或会议说明"
  191. ],
  192. "embedding_text": "该发票为私人旅游相关费用,如景区门票或旅游服务费,主要用于个人休闲活动,与企业经营活动无直接关系,应判定为个人消费。",
  193. "source": "人工审核确认"
  194. }
  195. , {
  196. "case_id": "CASE-BIZ-MED-101",
  197. "expense_type": "BUSINESS",
  198. "category": "员工福利",
  199. "subcategory": "员工体检",
  200. "invoice_item": "年度员工健康体检服务费",
  201. "seller_profile": "医疗体检机构",
  202. "decision": "BUSINESS",
  203. "risk_level": "LOW",
  204. "decision_reason": [
  205. "体检为企业统一组织",
  206. "费用由企业统一支付",
  207. "属于员工福利支出"
  208. ],
  209. "embedding_text": "该发票内容为员工健康体检服务费用,虽然体检本身具有个人属性,但本案例中体检由企业统一安排并出资,作为员工福利项目,与企业人力资源管理相关,因此判定为企业支出。",
  210. "source": "人工审核确认"
  211. }
  212. , {
  213. "case_id": "CASE-BIZ-FIT-102",
  214. "expense_type": "BUSINESS",
  215. "category": "员工福利",
  216. "subcategory": "健身福利",
  217. "invoice_item": "员工健身房年卡费用",
  218. "seller_profile": "健身服务机构",
  219. "decision": "BUSINESS",
  220. "risk_level": "LOW",
  221. "decision_reason": [
  222. "健身卡为企业统一采购",
  223. "用于员工福利",
  224. "非个人自行消费"
  225. ],
  226. "embedding_text": "发票项目为健身房年卡费用,表面上属于个人健身消费,但该费用由企业统一采购并发放给员工,作为员工福利项目,与企业员工关怀和福利制度相关,因此判定为企业支出。",
  227. "source": "人工审核确认"
  228. }
  229. , {
  230. "case_id": "CASE-BIZ-CLOTH-103",
  231. "expense_type": "BUSINESS",
  232. "category": "经营支出",
  233. "subcategory": "工装制服",
  234. "invoice_item": "员工工作服及制服采购费",
  235. "seller_profile": "服装生产及销售商",
  236. "decision": "BUSINESS",
  237. "risk_level": "LOW",
  238. "decision_reason": [
  239. "服装为企业统一采购",
  240. "用于员工工作场景",
  241. "不属于个人日常服饰"
  242. ],
  243. "embedding_text": "该发票为员工工作服或制服采购费用,虽然商品本身为服饰,但其用途明确为企业统一配置的工作服,用于业务或岗位需要,与个人日常穿着无关,因此判定为企业经营支出。",
  244. "source": "人工审核确认"
  245. }
  246. , {
  247. "case_id": "CASE-BIZ-ENT-104",
  248. "expense_type": "BUSINESS",
  249. "category": "员工福利",
  250. "subcategory": "团建活动",
  251. "invoice_item": "员工团建娱乐活动费用",
  252. "seller_profile": "影院 / KTV / 娱乐服务商",
  253. "decision": "BUSINESS",
  254. "risk_level": "MEDIUM",
  255. "decision_reason": [
  256. "活动为企业统一组织",
  257. "参与对象为员工集体",
  258. "费用由企业统一承担"
  259. ],
  260. "embedding_text": "发票内容为电影票、KTV 或其他娱乐活动费用,表面上属于个人娱乐消费,但该活动为企业统一组织的员工团建项目,费用由企业承担,属于员工福利或团队建设支出,因此判定为企业支出。",
  261. "source": "人工审核确认"
  262. }, {
  263. "case_id": "CASE-BIZ-EDU-105",
  264. "expense_type": "BUSINESS",
  265. "category": "经营支出",
  266. "subcategory": "员工培训",
  267. "invoice_item": "员工岗位技能培训费",
  268. "seller_profile": "职业培训机构",
  269. "decision": "BUSINESS",
  270. "risk_level": "LOW",
  271. "decision_reason": [
  272. "培训与岗位技能直接相关",
  273. "由企业统一组织",
  274. "属于经营所需支出"
  275. ],
  276. "embedding_text": "该发票为员工岗位技能培训费用,虽然形式上为教育培训支出,但培训内容直接服务于员工岗位能力提升,由企业统一安排并支付,属于企业经营所需支出,因此判定为企业支出。",
  277. "source": "人工审核确认"
  278. }
  279. , {
  280. "case_id": "CASE-BIZ-COS-106",
  281. "expense_type": "BUSINESS",
  282. "category": "经营支出",
  283. "subcategory": "业务用品",
  284. "invoice_item": "展示及业务用化妆品采购",
  285. "seller_profile": "化妆品供应商",
  286. "decision": "BUSINESS",
  287. "risk_level": "MEDIUM",
  288. "decision_reason": [
  289. "化妆品用于业务展示或客户体验",
  290. "非个人日常使用"
  291. ],
  292. "embedding_text": "该发票为化妆品或护肤品采购费用,商品本身具有个人消费特征,但在本案例中用于业务展示、客户体验或工作需要,并非个人日常使用,因此判定为企业经营支出。",
  293. "source": "人工审核确认"
  294. }
  295. , {
  296. "case_id": "CASE-BIZ-GIFT-107",
  297. "expense_type": "BUSINESS",
  298. "category": "员工福利",
  299. "subcategory": "节日福利",
  300. "invoice_item": "员工节日福利礼品采购",
  301. "seller_profile": "礼品及保健品供应商",
  302. "decision": "BUSINESS",
  303. "risk_level": "LOW",
  304. "decision_reason": [
  305. "礼品为企业统一采购",
  306. "作为员工福利发放",
  307. "非个人自行购买"
  308. ],
  309. "embedding_text": "发票内容为保健品或节日礼品采购费用,虽然商品本身具有个人消费属性,但该费用由企业统一采购并作为员工福利发放,属于企业福利支出,而非个人消费。",
  310. "source": "人工审核确认"
  311. }, {
  312. "case_id": "CASE-BIZ-TRAVEL-108",
  313. "expense_type": "BUSINESS",
  314. "category": "经营支出",
  315. "subcategory": "商务出行",
  316. "invoice_item": "会议及商务出行相关费用",
  317. "seller_profile": "会务 / 差旅服务商",
  318. "decision": "BUSINESS",
  319. "risk_level": "MEDIUM",
  320. "decision_reason": [
  321. "出行目的为商务或会议",
  322. "与企业经营活动直接相关"
  323. ],
  324. "embedding_text": "该发票为会议、商务出行或差旅相关费用,形式上与旅游消费相似,但其出行目的明确为业务活动或会议安排,与企业经营直接相关,因此判定为企业支出。",
  325. "source": "人工审核确认"
  326. }
  327. ]
  328. case_embed_update = [
  329. {
  330. "case_id": "CASE-PER-EDU-012",
  331. "expense_type": "PERSONAL",
  332. "category": "办公用品",
  333. "subcategory": "纸制品",
  334. "invoice_item": "*纸制品*MM 经典卷纸.",
  335. "seller_profile": "山姆会员商店",
  336. "decision": "PERSONAL",
  337. "risk_level": "MEDIUM",
  338. "decision_reason": [
  339. "商品为典型家庭日用消费品",
  340. "交易发生于面向个人会员的仓储式零售商店",
  341. "无批量采购或企业用途标注信息"
  342. ],
  343. "embedding_text": "案例显示,一名员工在山姆会员商店分店开具电子普通发票,购买项目为‘MM 经典卷纸’,金额69.9元。企业财务审核认为该支出属于员工个人生活物资采购,不符合公务报销条件。尽管纸张类物品可能用于办公场景,但结合商户性质和商品类型,未提供额外证明材料时,默认视为个人消费。此案例被多家企业纳入内部风控知识库作为典型示例。",
  344. "source": ""
  345. }
  346. ]