From 4c8def4b049135339d7e181a3073967ed5198af3 Mon Sep 17 00:00:00 2001 From: houhuan Date: Wed, 7 May 2025 19:29:02 +0800 Subject: [PATCH] =?UTF-8?q?=E6=9B=B4=E6=96=B0readme?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- README.md | 40 +++++++++- logs/__main__.log | 8 ++ logs/app.core.excel.converter.log | 42 ++++++++++ logs/app.core.excel.merger.log | 4 + logs/app.core.excel.processor.log | 114 ++++++++++++++++++++++++++++ logs/app.core.ocr.baidu_ocr.log | 1 + logs/app.core.ocr.table_ocr.log | 14 ++++ logs/app.services.ocr_service.log | 5 ++ logs/app.services.order_service.log | 6 ++ 9 files changed, 232 insertions(+), 2 deletions(-) diff --git a/README.md b/README.md index 5567f8c..d4f0e17 100644 --- a/README.md +++ b/README.md @@ -4,8 +4,8 @@ ## 版本信息 -- **当前版本**: v1.0 -- **发布日期**: 2025-05-02 +- **当前版本**: v1.1 +- **发布日期**: 2025-05-07 - **作者**: OCR订单处理团队 ## 功能特点 @@ -136,6 +136,35 @@ python run.py --merge | 包 | 保持原数量和单位不变 | 3包 → 3包 | | 其他单位 | 保持原数量和单位不变 | 5瓶 → 5瓶 | +### 单位自动推断规则 + +系统能够在缺少单位信息时,根据规格和其他信息自动推断单位: + +1. 
当单位为空,并且同时具备以下条件时: + - 有商品编码 + - 有规格信息 + - 有数量信息 + - 有单价信息 + - 规格符合容量*数量格式(如"500ml*15"、"1L*12"等)或简单的数量*数量格式(如"1*12") + + 系统会: + - 自动将单位设置为"件" + - 然后按照件的处理规则进行转换 + + 示例: + - 商品编码: 6954767400129 + - 名称: 美汁源果粒橙1.8L*8瓶 + - 规格: 1.8L*8 + - 数量: 1 + - 单价: 65 + - 单位: (空) + + 处理后: + - 单位先被推断为"件",再按件的处理规则转换 + - 数量: 1 * 8 = 8 + - 单价: 65 / 8 = 8.125 + - 转换后的最终单位: 瓶 + ### 提和盒单位特殊处理 系统对"提"和"盒"单位有特殊的处理逻辑: @@ -224,6 +253,13 @@ MIT License ## 更新日志 +### v1.1 (2025-05-07) + +#### 功能更新 +- 单位自动推断:当单位为空但有商品编码、规格、数量、单价等信息,且规格符合容量*数量格式(如"1.8L*8")或简单的数量*数量格式(如"1*12")时,自动将单位设置为"件"并按照件的处理规则进行转换 +- 规格解析优化:改进对容量*数量格式规格的解析,如"1.8L*8"能正确识别包装数量为8 +- 规格提取增强:从商品名称中提取"容量*数量"格式的规格时,能正确识别如"美汁源果粒橙1.8L*8瓶"中的"1.8L*8"部分 + ### v1.0 (2025-05-02) #### 主要功能 diff --git a/logs/__main__.log b/logs/__main__.log index 4422519..eda483d 100644 --- a/logs/__main__.log +++ b/logs/__main__.log @@ -311,3 +311,11 @@ 2025-05-07 18:46:29,610 - __main__ - WARNING - 未找到可处理的Excel文件 2025-05-07 18:47:16,625 - __main__ - INFO - 处理Excel文件: D:/My Documents/python/orc-order-v2/data/output/微信图片_20250507180130.xlsx 2025-05-07 18:47:23,859 - __main__ - INFO - Excel处理成功,输出文件: D:\My Documents\python\orc-order-v2\data\output\采购单_微信图片_20250507180130.xls +2025-05-07 19:17:08,292 - __main__ - INFO - === 流程步骤 1: OCR识别 === +2025-05-07 19:17:08,293 - __main__ - INFO - 批量处理所有图片 +2025-05-07 19:17:09,737 - __main__ - INFO - OCR处理完成,总计: 1,成功: 1 +2025-05-07 19:17:09,737 - __main__ - INFO - === 流程步骤 2: Excel处理 === +2025-05-07 19:17:09,738 - __main__ - INFO - 处理最新的Excel文件: D:\My Documents\python\orc-order-v2\data\output\微信图片_20250507191231.xlsx +2025-05-07 19:17:10,515 - __main__ - ERROR - Excel处理失败 +2025-05-07 19:21:56,953 - __main__ - INFO - 处理Excel文件: D:/My Documents/python/orc-order-v2/data/output/微信图片_20250507191231.xlsx +2025-05-07 19:22:08,043 - __main__ - INFO - Excel处理成功,输出文件: D:\My Documents\python\orc-order-v2\data\output\采购单_微信图片_20250507191231.xls diff --git a/logs/app.core.excel.converter.log b/logs/app.core.excel.converter.log index 2da3dd4..5fca216 100644 --- 
a/logs/app.core.excel.converter.log +++ b/logs/app.core.excel.converter.log @@ -1351,3 +1351,45 @@ 2025-05-07 18:47:17,303 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 3.0, 单价: 0.0, 单位: 瓶 2025-05-07 18:47:17,303 - app.core.excel.converter - INFO - 解析容量(L)规格: 500L*12 -> 1*12 2025-05-07 18:47:17,303 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 1.0, 单价: 0.0, 单位: 听 +2025-05-07 19:21:57,610 - app.core.excel.converter - INFO - 解析二级规格: 1*12 -> 1*12 +2025-05-07 19:21:57,610 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 5.0, 单价: 4.5, 单位: 袋 +2025-05-07 19:21:57,611 - app.core.excel.converter - INFO - 解析二级规格: 1*30 -> 1*30 +2025-05-07 19:21:57,611 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 5.0, 单价: 3.75, 单位: 袋 +2025-05-07 19:21:57,612 - app.core.excel.converter - INFO - 解析二级规格: 1*30 -> 1*30 +2025-05-07 19:21:57,614 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 7.0, 单价: 3.75, 单位: 袋 +2025-05-07 19:21:57,615 - app.core.excel.converter - INFO - 解析二级规格: 1*30 -> 1*30 +2025-05-07 19:21:57,618 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 4.0, 单价: 2.8, 单位: 袋 +2025-05-07 19:21:57,619 - app.core.excel.converter - INFO - 解析二级规格: 1*36 -> 1*36 +2025-05-07 19:21:57,619 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 3.0, 单价: 1.9, 单位: 袋 +2025-05-07 19:21:57,620 - app.core.excel.converter - INFO - 解析二级规格: 1*28 -> 1*28 +2025-05-07 19:21:57,620 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 4.0, 单价: 4.4, 单位: 袋 +2025-05-07 19:21:57,662 - app.core.excel.converter - INFO - 解析二级规格: 1*24 -> 1*24 +2025-05-07 19:21:57,663 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 3.0, 单价: 2.7, 单位: 袋 +2025-05-07 19:21:57,667 - app.core.excel.converter - INFO - 提取规格: 麦满天下100g毛毛虫面包(短保) -> 100*None +2025-05-07 19:21:57,668 - app.core.excel.converter - INFO - 从名称推断规格(通用模式): 麦满天下100g毛毛虫面包(短保) -> 100*None +2025-05-07 19:21:57,670 - app.core.excel.converter - WARNING - 无法解析规格: 100*None,使用默认值1*1 +2025-05-07 19:21:57,670 - app.core.excel.converter - INFO - 
其他单位处理: 保持原样 数量: 2.0, 单价: 3.8, 单位: 袋 +2025-05-07 19:21:57,671 - app.core.excel.converter - INFO - 提取规格: 麦满天下100g肉松卷面包(短保) -> 100*None +2025-05-07 19:21:57,671 - app.core.excel.converter - INFO - 从名称推断规格(通用模式): 麦满天下100g肉松卷面包(短保) -> 100*None +2025-05-07 19:21:57,672 - app.core.excel.converter - WARNING - 无法解析规格: 100*None,使用默认值1*1 +2025-05-07 19:21:57,672 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 2.0, 单价: 3.8, 单位: 袋 +2025-05-07 19:21:57,672 - app.core.excel.converter - INFO - 提取规格: 麦满天下120g黄金蛋皮面包(短保) -> 120*None +2025-05-07 19:21:57,672 - app.core.excel.converter - INFO - 从名称推断规格(通用模式): 麦满天下120g黄金蛋皮面包(短保) -> 120*None +2025-05-07 19:21:57,673 - app.core.excel.converter - WARNING - 无法解析规格: 120*None,使用默认值1*1 +2025-05-07 19:21:57,673 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 2.0, 单价: 3.8, 单位: 袋 +2025-05-07 19:21:57,673 - app.core.excel.converter - INFO - 提取规格: 麦满天下110g脆脆肠面包(短保) -> 110*None +2025-05-07 19:21:57,673 - app.core.excel.converter - INFO - 从名称推断规格(通用模式): 麦满天下110g脆脆肠面包(短保) -> 110*None +2025-05-07 19:21:57,674 - app.core.excel.converter - WARNING - 无法解析规格: 110*None,使用默认值1*1 +2025-05-07 19:21:57,674 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 2.0, 单价: 3.8, 单位: 袋 +2025-05-07 19:21:57,674 - app.core.excel.converter - INFO - 解析二级规格: 1*32 -> 1*32 +2025-05-07 19:21:57,674 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 4.0, 单价: 3.8, 单位: 袋 +2025-05-07 19:22:00,734 - app.core.excel.converter - INFO - 解析二级规格: 1*24 -> 1*24 +2025-05-07 19:22:00,734 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 4.0, 单价: 3.0, 单位: 袋 +2025-05-07 19:22:00,734 - app.core.excel.converter - INFO - 解析二级规格: 1*24 -> 1*24 +2025-05-07 19:22:00,734 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 5.0, 单价: 3.0, 单位: 袋 +2025-05-07 19:22:00,735 - app.core.excel.converter - INFO - 解析二级规格: 1*24 -> 1*24 +2025-05-07 19:22:00,735 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 3.0, 单价: 3.0, 单位: 袋 +2025-05-07 19:22:00,735 - app.core.excel.converter - INFO - 提取规格: 
阿尔卑斯(33g21条)12牛奶软条糖(酸奶) -> 33*21 +2025-05-07 19:22:00,735 - app.core.excel.converter - INFO - 从名称推断规格(通用模式): 阿尔卑斯(33g21条)12牛奶软条糖(酸奶) -> 33*21 +2025-05-07 19:22:00,736 - app.core.excel.converter - INFO - 解析二级规格: 33*21 -> 33*21 +2025-05-07 19:22:00,736 - app.core.excel.converter - INFO - 其他单位处理: 保持原样 数量: 21.0, 单价: 1.88, 单位: 条 diff --git a/logs/app.core.excel.merger.log b/logs/app.core.excel.merger.log index d6c5f25..f5749b3 100644 --- a/logs/app.core.excel.merger.log +++ b/logs/app.core.excel.merger.log @@ -441,3 +441,7 @@ 2025-05-07 18:46:29,609 - app.core.excel.merger - INFO - 初始化完成,模板文件: templates\银豹-采购单模板.xls 2025-05-07 18:47:16,624 - app.core.excel.merger - INFO - 初始化PurchaseOrderMerger 2025-05-07 18:47:16,624 - app.core.excel.merger - INFO - 初始化完成,模板文件: templates\银豹-采购单模板.xls +2025-05-07 19:17:08,291 - app.core.excel.merger - INFO - 初始化PurchaseOrderMerger +2025-05-07 19:17:08,292 - app.core.excel.merger - INFO - 初始化完成,模板文件: templates\银豹-采购单模板.xls +2025-05-07 19:21:56,952 - app.core.excel.merger - INFO - 初始化PurchaseOrderMerger +2025-05-07 19:21:56,952 - app.core.excel.merger - INFO - 初始化完成,模板文件: templates\银豹-采购单模板.xls diff --git a/logs/app.core.excel.processor.log b/logs/app.core.excel.processor.log index 77491b7..ef980c7 100644 --- a/logs/app.core.excel.processor.log +++ b/logs/app.core.excel.processor.log @@ -4087,3 +4087,117 @@ ValueError: could not convert string to float: '2\n96' 2025-05-07 18:47:20,239 - app.core.excel.processor - INFO - 条码 6922467905046 填充:仅有赠品,采购量=0,赠品数量=1.0 2025-05-07 18:47:23,857 - app.core.excel.processor - INFO - 采购单已保存到: D:\My Documents\python\orc-order-v2\data\output\采购单_微信图片_20250507180130.xls 2025-05-07 18:47:23,859 - app.core.excel.processor - INFO - 采购单已保存到: D:\My Documents\python\orc-order-v2\data\output\采购单_微信图片_20250507180130.xls +2025-05-07 19:17:08,291 - app.core.excel.processor - INFO - 初始化ExcelProcessor +2025-05-07 19:17:08,291 - app.core.excel.processor - INFO - 初始化完成,模板文件: templates\银豹-采购单模板.xls +2025-05-07 
19:17:09,737 - app.core.excel.processor - INFO - 搜索目录 D:\My Documents\python\orc-order-v2\data\output 中的Excel文件 +2025-05-07 19:17:09,738 - app.core.excel.processor - INFO - 找到最新的Excel文件: D:\My Documents\python\orc-order-v2\data\output\微信图片_20250507191231.xlsx +2025-05-07 19:17:09,738 - app.core.excel.processor - INFO - 开始处理Excel文件: D:\My Documents\python\orc-order-v2\data\output\微信图片_20250507191231.xlsx +2025-05-07 19:17:10,498 - app.core.excel.processor - INFO - 成功读取Excel文件: D:\My Documents\python\orc-order-v2\data\output\微信图片_20250507191231.xlsx, 共 16 行 +2025-05-07 19:17:10,499 - app.core.excel.processor - INFO - 找到可能的表头行: 第1行,评分: 20 +2025-05-07 19:17:10,499 - app.core.excel.processor - INFO - 识别到表头在第 1 行 +2025-05-07 19:17:10,506 - app.core.excel.processor - INFO - 使用表头行重新读取数据,共 15 行有效数据 +2025-05-07 19:17:10,510 - app.core.excel.processor - ERROR - 未找到条码列,无法处理 +2025-05-07 19:17:10,511 - app.core.excel.processor - INFO - 列名映射结果: {} +2025-05-07 19:17:10,512 - app.core.excel.processor - INFO - 是否存在规格列: False +2025-05-07 19:17:10,515 - app.core.excel.processor - INFO - 提取到 0 个商品信息 +2025-05-07 19:17:10,515 - app.core.excel.processor - WARNING - 未提取到有效商品信息 +2025-05-07 19:21:56,951 - app.core.excel.processor - INFO - 初始化ExcelProcessor +2025-05-07 19:21:56,952 - app.core.excel.processor - INFO - 初始化完成,模板文件: templates\银豹-采购单模板.xls +2025-05-07 19:21:56,954 - app.core.excel.processor - INFO - 开始处理Excel文件: D:/My Documents/python/orc-order-v2/data/output/微信图片_20250507191231.xlsx +2025-05-07 19:21:57,556 - app.core.excel.processor - INFO - 成功读取Excel文件: D:/My Documents/python/orc-order-v2/data/output/微信图片_20250507191231.xlsx, 共 17 行 +2025-05-07 19:21:57,558 - app.core.excel.processor - INFO - 找到可能的表头行: 第1行,评分: 35 +2025-05-07 19:21:57,558 - app.core.excel.processor - INFO - 识别到表头在第 1 行 +2025-05-07 19:21:57,604 - app.core.excel.processor - INFO - 使用表头行重新读取数据,共 16 行有效数据 +2025-05-07 19:21:57,605 - app.core.excel.processor - INFO - 找到精确匹配的条码列: 条形码 +2025-05-07 19:21:57,605 - 
app.core.excel.processor - INFO - 使用条码列: 条形码 +2025-05-07 19:21:57,605 - app.core.excel.processor - INFO - 找到name列(部分匹配): 货品名称 +2025-05-07 19:21:57,605 - app.core.excel.processor - INFO - 找到quantity列: 数量 +2025-05-07 19:21:57,605 - app.core.excel.processor - INFO - 找到unit列: 单位 +2025-05-07 19:21:57,605 - app.core.excel.processor - INFO - 找到price列: 单价 +2025-05-07 19:21:57,605 - app.core.excel.processor - INFO - 列名映射结果: {'barcode': '条形码', 'name': '货品名称', 'quantity': '数量', 'unit': '单位', 'price': '单价'} +2025-05-07 19:21:57,606 - app.core.excel.processor - INFO - 是否存在规格列: False +2025-05-07 19:21:57,607 - app.core.excel.processor - INFO - 第1行: 提取商品信息 条码=6976909150303, 名称=泓一225g*12千层手撕面包(中保), 规格=, 数量=5.0, 单位=袋, 单价=4.5 +2025-05-07 19:21:57,608 - app.core.excel.processor - INFO - 从商品名称提取重量/容量规格: 泓一225g*12千层手撕面包(中保) -> 1*12, 包装数量=12 +2025-05-07 19:21:57,611 - app.core.excel.processor - INFO - 第2行: 提取商品信息 条码=6972052181225, 名称=鲜华食品100g*30艾草糕团(蛋黄肉松味)袋装食滋源, 规格=, 数量=5.0, 单位=袋, 单价=3.75 +2025-05-07 19:21:57,611 - app.core.excel.processor - INFO - 从商品名称提取重量/容量规格: 鲜华食品100g*30艾草糕团(蛋黄肉松味)袋装食滋源 -> 1*30, 包装数量=30 +2025-05-07 19:21:57,612 - app.core.excel.processor - INFO - 第3行: 提取商品信息 条码=6972052181331, 名称=鲜华食品100g*30艾草糕团(红豆蛋黄味)袋装食滋源, 规格=, 数量=7.0, 单位=袋, 单价=3.75 +2025-05-07 19:21:57,612 - app.core.excel.processor - INFO - 从商品名称提取重量/容量规格: 鲜华食品100g*30艾草糕团(红豆蛋黄味)袋装食滋源 -> 1*30, 包装数量=30 +2025-05-07 19:21:57,615 - app.core.excel.processor - INFO - 第4行: 提取商品信息 条码=6911988030177, 名称=美焙辰100g*30红豆起酥面包(短保), 规格=, 数量=4.0, 单位=袋, 单价=2.8 +2025-05-07 19:21:57,615 - app.core.excel.processor - INFO - 从商品名称提取重量/容量规格: 美焙辰100g*30红豆起酥面包(短保) -> 1*30, 包装数量=30 +2025-05-07 19:21:57,618 - app.core.excel.processor - INFO - 第5行: 提取商品信息 条码=6911988029997, 名称=美焙辰100g*36汤熟全麦吐司面包(短保), 规格=, 数量=3.0, 单位=袋, 单价=1.9 +2025-05-07 19:21:57,619 - app.core.excel.processor - INFO - 从商品名称提取重量/容量规格: 美焙辰100g*36汤熟全麦吐司面包(短保) -> 1*36, 包装数量=36 +2025-05-07 19:21:57,620 - app.core.excel.processor - INFO - 第6行: 提取商品信息 条码=6911988030061, 
名称=美焙辰170g*28薄皮豆沙包(短保), 规格=, 数量=4.0, 单位=袋, 单价=4.4 +2025-05-07 19:21:57,620 - app.core.excel.processor - INFO - 从商品名称提取重量/容量规格: 美焙辰170g*28薄皮豆沙包(短保) -> 1*28, 包装数量=28 +2025-05-07 19:21:57,621 - app.core.excel.processor - INFO - 第7行: 提取商品信息 条码=6911988031952, 名称=美焙辰85g*24咸松球面包(短保), 规格=, 数量=3.0, 单位=袋, 单价=2.7 +2025-05-07 19:21:57,662 - app.core.excel.processor - INFO - 从商品名称提取重量/容量规格: 美焙辰85g*24咸松球面包(短保) -> 1*24, 包装数量=24 +2025-05-07 19:21:57,663 - app.core.excel.processor - INFO - 第8行: 提取商品信息 条码=6974640059909, 名称=麦满天下100g毛毛虫面包(短保), 规格=, 数量=2.0, 单位=袋, 单价=3.8 +2025-05-07 19:21:57,670 - app.core.excel.processor - INFO - 从商品名称推断规格: 麦满天下100g毛毛虫面包(短保) -> 100*None, 包装数量=None +2025-05-07 19:21:57,671 - app.core.excel.processor - INFO - 第9行: 提取商品信息 条码=6974640059862, 名称=麦满天下100g肉松卷面包(短保), 规格=, 数量=2.0, 单位=袋, 单价=3.8 +2025-05-07 19:21:57,671 - app.core.excel.processor - INFO - 从商品名称推断规格: 麦满天下100g肉松卷面包(短保) -> 100*None, 包装数量=None +2025-05-07 19:21:57,672 - app.core.excel.processor - INFO - 第10行: 提取商品信息 条码=6974640059022, 名称=麦满天下120g黄金蛋皮面包(短保), 规格=, 数量=2.0, 单位=袋, 单价=3.8 +2025-05-07 19:21:57,672 - app.core.excel.processor - INFO - 从商品名称推断规格: 麦满天下120g黄金蛋皮面包(短保) -> 120*None, 包装数量=None +2025-05-07 19:21:57,673 - app.core.excel.processor - INFO - 第11行: 提取商品信息 条码=6974640059039, 名称=麦满天下110g脆脆肠面包(短保), 规格=, 数量=2.0, 单位=袋, 单价=3.8 +2025-05-07 19:21:57,674 - app.core.excel.processor - INFO - 从商品名称推断规格: 麦满天下110g脆脆肠面包(短保) -> 110*None, 包装数量=None +2025-05-07 19:21:57,674 - app.core.excel.processor - INFO - 第12行: 提取商品信息 条码=6911988033499, 名称=美焙辰120g*32纯蛋糕(原味)(中保), 规格=, 数量=4.0, 单位=袋, 单价=3.8 +2025-05-07 19:21:57,674 - app.core.excel.processor - INFO - 从商品名称提取重量/容量规格: 美焙辰120g*32纯蛋糕(原味)(中保) -> 1*32, 包装数量=32 +2025-05-07 19:21:57,675 - app.core.excel.processor - INFO - 第13行: 提取商品信息 条码=6911988045744, 名称=美焙辰95g*24大椰蓉面包(中保), 规格=, 数量=4.0, 单位=袋, 单价=3.0 +2025-05-07 19:22:00,734 - app.core.excel.processor - INFO - 从商品名称提取重量/容量规格: 美焙辰95g*24大椰蓉面包(中保) -> 1*24, 包装数量=24 +2025-05-07 19:22:00,734 - app.core.excel.processor - 
INFO - 第14行: 提取商品信息 条码=6911988045966, 名称=美焙辰80g*24乳酸椰吉面包(中保), 规格=, 数量=5.0, 单位=袋, 单价=3.0 +2025-05-07 19:22:00,734 - app.core.excel.processor - INFO - 从商品名称提取重量/容量规格: 美焙辰80g*24乳酸椰吉面包(中保) -> 1*24, 包装数量=24 +2025-05-07 19:22:00,735 - app.core.excel.processor - INFO - 第15行: 提取商品信息 条码=6911988058898, 名称=美焙辰90g*24岩烧大唱盘面包(奶香味)(中保), 规格=, 数量=3.0, 单位=袋, 单价=3.0 +2025-05-07 19:22:00,735 - app.core.excel.processor - INFO - 从商品名称提取重量/容量规格: 美焙辰90g*24岩烧大唱盘面包(奶香味)(中保) -> 1*24, 包装数量=24 +2025-05-07 19:22:00,735 - app.core.excel.processor - INFO - 第16行: 提取商品信息 条码=6911316375307, 名称=阿尔卑斯(33g21条)12牛奶软条糖(酸奶), 规格=, 数量=21.0, 单位=条, 单价=1.88 +2025-05-07 19:22:00,736 - app.core.excel.processor - INFO - 从商品名称推断规格: 阿尔卑斯(33g21条)12牛奶软条糖(酸奶) -> 33*21, 包装数量=21 +2025-05-07 19:22:00,736 - app.core.excel.processor - INFO - 提取到 16 个商品信息 +2025-05-07 19:22:00,742 - app.core.excel.processor - INFO - 开始处理16 个产品信息 +2025-05-07 19:22:00,743 - app.core.excel.processor - INFO - 处理商品: 条码=6976909150303, 数量=5.0, 单价=4.5, 是否赠品=False +2025-05-07 19:22:00,743 - app.core.excel.processor - INFO - 发现正常商品:条码6976909150303, 数量=5.0, 单价=4.5 +2025-05-07 19:22:00,743 - app.core.excel.processor - INFO - 处理商品: 条码=6972052181225, 数量=5.0, 单价=3.75, 是否赠品=False +2025-05-07 19:22:00,743 - app.core.excel.processor - INFO - 发现正常商品:条码6972052181225, 数量=5.0, 单价=3.75 +2025-05-07 19:22:00,743 - app.core.excel.processor - INFO - 处理商品: 条码=6972052181331, 数量=7.0, 单价=3.75, 是否赠品=False +2025-05-07 19:22:00,743 - app.core.excel.processor - INFO - 发现正常商品:条码6972052181331, 数量=7.0, 单价=3.75 +2025-05-07 19:22:00,743 - app.core.excel.processor - INFO - 处理商品: 条码=6911988030177, 数量=4.0, 单价=2.8, 是否赠品=False +2025-05-07 19:22:00,743 - app.core.excel.processor - INFO - 发现正常商品:条码6911988030177, 数量=4.0, 单价=2.8 +2025-05-07 19:22:00,743 - app.core.excel.processor - INFO - 处理商品: 条码=6911988029997, 数量=3.0, 单价=1.9, 是否赠品=False +2025-05-07 19:22:00,743 - app.core.excel.processor - INFO - 发现正常商品:条码6911988029997, 数量=3.0, 单价=1.9 +2025-05-07 19:22:00,743 - app.core.excel.processor - 
INFO - 处理商品: 条码=6911988030061, 数量=4.0, 单价=4.4, 是否赠品=False +2025-05-07 19:22:00,743 - app.core.excel.processor - INFO - 发现正常商品:条码6911988030061, 数量=4.0, 单价=4.4 +2025-05-07 19:22:00,744 - app.core.excel.processor - INFO - 处理商品: 条码=6911988031952, 数量=3.0, 单价=2.7, 是否赠品=False +2025-05-07 19:22:00,744 - app.core.excel.processor - INFO - 发现正常商品:条码6911988031952, 数量=3.0, 单价=2.7 +2025-05-07 19:22:00,744 - app.core.excel.processor - INFO - 处理商品: 条码=6974640059909, 数量=2.0, 单价=3.8, 是否赠品=False +2025-05-07 19:22:04,410 - app.core.excel.processor - INFO - 发现正常商品:条码6974640059909, 数量=2.0, 单价=3.8 +2025-05-07 19:22:04,411 - app.core.excel.processor - INFO - 处理商品: 条码=6974640059862, 数量=2.0, 单价=3.8, 是否赠品=False +2025-05-07 19:22:04,411 - app.core.excel.processor - INFO - 发现正常商品:条码6974640059862, 数量=2.0, 单价=3.8 +2025-05-07 19:22:04,411 - app.core.excel.processor - INFO - 处理商品: 条码=6974640059022, 数量=2.0, 单价=3.8, 是否赠品=False +2025-05-07 19:22:04,412 - app.core.excel.processor - INFO - 发现正常商品:条码6974640059022, 数量=2.0, 单价=3.8 +2025-05-07 19:22:04,412 - app.core.excel.processor - INFO - 处理商品: 条码=6974640059039, 数量=2.0, 单价=3.8, 是否赠品=False +2025-05-07 19:22:04,412 - app.core.excel.processor - INFO - 发现正常商品:条码6974640059039, 数量=2.0, 单价=3.8 +2025-05-07 19:22:04,412 - app.core.excel.processor - INFO - 处理商品: 条码=6911988033499, 数量=4.0, 单价=3.8, 是否赠品=False +2025-05-07 19:22:04,412 - app.core.excel.processor - INFO - 发现正常商品:条码6911988033499, 数量=4.0, 单价=3.8 +2025-05-07 19:22:04,413 - app.core.excel.processor - INFO - 处理商品: 条码=6911988045744, 数量=4.0, 单价=3.0, 是否赠品=False +2025-05-07 19:22:04,413 - app.core.excel.processor - INFO - 发现正常商品:条码6911988045744, 数量=4.0, 单价=3.0 +2025-05-07 19:22:04,413 - app.core.excel.processor - INFO - 处理商品: 条码=6911988045966, 数量=5.0, 单价=3.0, 是否赠品=False +2025-05-07 19:22:04,413 - app.core.excel.processor - INFO - 发现正常商品:条码6911988045966, 数量=5.0, 单价=3.0 +2025-05-07 19:22:04,413 - app.core.excel.processor - INFO - 处理商品: 条码=6911988058898, 数量=3.0, 单价=3.0, 是否赠品=False +2025-05-07 19:22:04,413 - 
app.core.excel.processor - INFO - 发现正常商品:条码6911988058898, 数量=3.0, 单价=3.0 +2025-05-07 19:22:04,413 - app.core.excel.processor - INFO - 处理商品: 条码=6911316375307, 数量=21.0, 单价=1.88, 是否赠品=False +2025-05-07 19:22:04,413 - app.core.excel.processor - INFO - 发现正常商品:条码6911316375307, 数量=21.0, 单价=1.88 +2025-05-07 19:22:04,413 - app.core.excel.processor - INFO - 分组后共16 个不同条码的商品 +2025-05-07 19:22:04,414 - app.core.excel.processor - INFO - 条码 6976909150303 处理结果:正常商品数量5.0,单价4.5,赠品数量0 +2025-05-07 19:22:04,414 - app.core.excel.processor - INFO - 条码 6972052181225 处理结果:正常商品数量5.0,单价3.75,赠品数量0 +2025-05-07 19:22:04,414 - app.core.excel.processor - INFO - 条码 6972052181331 处理结果:正常商品数量7.0,单价3.75,赠品数量0 +2025-05-07 19:22:04,414 - app.core.excel.processor - INFO - 条码 6911988030177 处理结果:正常商品数量4.0,单价2.8,赠品数量0 +2025-05-07 19:22:04,414 - app.core.excel.processor - INFO - 条码 6911988029997 处理结果:正常商品数量3.0,单价1.9,赠品数量0 +2025-05-07 19:22:04,414 - app.core.excel.processor - INFO - 条码 6911988030061 处理结果:正常商品数量4.0,单价4.4,赠品数量0 +2025-05-07 19:22:04,414 - app.core.excel.processor - INFO - 条码 6911988031952 处理结果:正常商品数量3.0,单价2.7,赠品数量0 +2025-05-07 19:22:04,414 - app.core.excel.processor - INFO - 条码 6974640059909 处理结果:正常商品数量2.0,单价3.8,赠品数量0 +2025-05-07 19:22:04,414 - app.core.excel.processor - INFO - 条码 6974640059862 处理结果:正常商品数量2.0,单价3.8,赠品数量0 +2025-05-07 19:22:04,414 - app.core.excel.processor - INFO - 条码 6974640059022 处理结果:正常商品数量2.0,单价3.8,赠品数量0 +2025-05-07 19:22:04,415 - app.core.excel.processor - INFO - 条码 6974640059039 处理结果:正常商品数量2.0,单价3.8,赠品数量0 +2025-05-07 19:22:04,415 - app.core.excel.processor - INFO - 条码 6911988033499 处理结果:正常商品数量4.0,单价3.8,赠品数量0 +2025-05-07 19:22:04,415 - app.core.excel.processor - INFO - 条码 6911988045744 处理结果:正常商品数量4.0,单价3.0,赠品数量0 +2025-05-07 19:22:04,415 - app.core.excel.processor - INFO - 条码 6911988045966 处理结果:正常商品数量5.0,单价3.0,赠品数量0 +2025-05-07 19:22:04,415 - app.core.excel.processor - INFO - 条码 6911988058898 处理结果:正常商品数量3.0,单价3.0,赠品数量0 +2025-05-07 19:22:04,415 - app.core.excel.processor - 
INFO - 条码 6911316375307 处理结果:正常商品数量21.0,单价1.88,赠品数量0 +2025-05-07 19:22:08,041 - app.core.excel.processor - INFO - 采购单已保存到: D:\My Documents\python\orc-order-v2\data\output\采购单_微信图片_20250507191231.xls +2025-05-07 19:22:08,043 - app.core.excel.processor - INFO - 采购单已保存到: D:\My Documents\python\orc-order-v2\data\output\采购单_微信图片_20250507191231.xls diff --git a/logs/app.core.ocr.baidu_ocr.log b/logs/app.core.ocr.baidu_ocr.log index d15903a..c580941 100644 --- a/logs/app.core.ocr.baidu_ocr.log +++ b/logs/app.core.ocr.baidu_ocr.log @@ -60,3 +60,4 @@ 2025-05-05 22:22:22,618 - app.core.ocr.baidu_ocr - ERROR - 百度OCR API错误: recognize error 2025-05-06 20:39:59,192 - app.core.ocr.baidu_ocr - INFO - 成功获取访问令牌 2025-05-07 18:01:37,558 - app.core.ocr.baidu_ocr - INFO - 成功获取访问令牌 +2025-05-07 19:17:08,701 - app.core.ocr.baidu_ocr - INFO - 成功获取访问令牌 diff --git a/logs/app.core.ocr.table_ocr.log b/logs/app.core.ocr.table_ocr.log index df71962..3aedd55 100644 --- a/logs/app.core.ocr.table_ocr.log +++ b/logs/app.core.ocr.table_ocr.log @@ -535,3 +535,17 @@ 2025-05-07 18:47:16,622 - app.core.ocr.table_ocr - INFO - 使用输出目录: D:\My Documents\python\orc-order-v2\data\output 2025-05-07 18:47:16,622 - app.core.ocr.table_ocr - INFO - 使用临时目录: D:\My Documents\python\orc-order-v2\data\temp 2025-05-07 18:47:16,623 - app.core.ocr.table_ocr - INFO - OCR处理器初始化完成,输入目录: D:\My Documents\python\orc-order-v2\data\input, 输出目录: D:\My Documents\python\orc-order-v2\data\output +2025-05-07 19:17:08,290 - app.core.ocr.table_ocr - INFO - 使用输入目录: D:\My Documents\python\orc-order-v2\data\input +2025-05-07 19:17:08,290 - app.core.ocr.table_ocr - INFO - 使用输出目录: D:\My Documents\python\orc-order-v2\data\output +2025-05-07 19:17:08,290 - app.core.ocr.table_ocr - INFO - 使用临时目录: D:\My Documents\python\orc-order-v2\data\temp +2025-05-07 19:17:08,290 - app.core.ocr.table_ocr - INFO - OCR处理器初始化完成,输入目录: D:\My Documents\python\orc-order-v2\data\input, 输出目录: D:\My Documents\python\orc-order-v2\data\output +2025-05-07 19:17:08,293 - 
app.core.ocr.table_ocr - INFO - 找到 1 个图片文件,其中 1 个未处理 +2025-05-07 19:17:08,293 - app.core.ocr.table_ocr - INFO - 处理批次 1/1, 大小: 1 +2025-05-07 19:17:08,296 - app.core.ocr.table_ocr - INFO - 开始处理图片: D:\My Documents\python\orc-order-v2\data\input\微信图片_20250507191231.jpg +2025-05-07 19:17:09,733 - app.core.ocr.table_ocr - INFO - 图片处理成功: D:\My Documents\python\orc-order-v2\data\input\微信图片_20250507191231.jpg, 输出文件: D:\My Documents\python\orc-order-v2\data\output\微信图片_20250507191231.xlsx +2025-05-07 19:17:09,736 - app.core.ocr.table_ocr - INFO - 批次处理完成, 成功: 1/1 +2025-05-07 19:17:09,736 - app.core.ocr.table_ocr - INFO - 所有图片处理完成, 总计: 1, 成功: 1 +2025-05-07 19:21:56,949 - app.core.ocr.table_ocr - INFO - 使用输入目录: D:\My Documents\python\orc-order-v2\data\input +2025-05-07 19:21:56,949 - app.core.ocr.table_ocr - INFO - 使用输出目录: D:\My Documents\python\orc-order-v2\data\output +2025-05-07 19:21:56,949 - app.core.ocr.table_ocr - INFO - 使用临时目录: D:\My Documents\python\orc-order-v2\data\temp +2025-05-07 19:21:56,950 - app.core.ocr.table_ocr - INFO - OCR处理器初始化完成,输入目录: D:\My Documents\python\orc-order-v2\data\input, 输出目录: D:\My Documents\python\orc-order-v2\data\output diff --git a/logs/app.services.ocr_service.log b/logs/app.services.ocr_service.log index 8661246..c7df805 100644 --- a/logs/app.services.ocr_service.log +++ b/logs/app.services.ocr_service.log @@ -220,3 +220,8 @@ 2025-05-07 18:46:29,607 - app.services.ocr_service - INFO - OCRService初始化完成 2025-05-07 18:47:16,621 - app.services.ocr_service - INFO - 初始化OCRService 2025-05-07 18:47:16,623 - app.services.ocr_service - INFO - OCRService初始化完成 +2025-05-07 19:17:08,288 - app.services.ocr_service - INFO - 初始化OCRService +2025-05-07 19:17:08,290 - app.services.ocr_service - INFO - OCRService初始化完成 +2025-05-07 19:17:08,293 - app.services.ocr_service - INFO - OCRService开始批量处理图片, batch_size=None, max_workers=None +2025-05-07 19:21:56,948 - app.services.ocr_service - INFO - 初始化OCRService +2025-05-07 19:21:56,950 - app.services.ocr_service - 
INFO - OCRService初始化完成 diff --git a/logs/app.services.order_service.log b/logs/app.services.order_service.log index d1253dc..9dce94d 100644 --- a/logs/app.services.order_service.log +++ b/logs/app.services.order_service.log @@ -251,3 +251,9 @@ 2025-05-07 18:47:16,623 - app.services.order_service - INFO - 初始化OrderService 2025-05-07 18:47:16,625 - app.services.order_service - INFO - OrderService初始化完成 2025-05-07 18:47:16,625 - app.services.order_service - INFO - OrderService开始处理指定Excel文件: D:/My Documents/python/orc-order-v2/data/output/微信图片_20250507180130.xlsx +2025-05-07 19:17:08,290 - app.services.order_service - INFO - 初始化OrderService +2025-05-07 19:17:08,292 - app.services.order_service - INFO - OrderService初始化完成 +2025-05-07 19:17:09,738 - app.services.order_service - INFO - OrderService开始处理指定Excel文件: D:\My Documents\python\orc-order-v2\data\output\微信图片_20250507191231.xlsx +2025-05-07 19:21:56,950 - app.services.order_service - INFO - 初始化OrderService +2025-05-07 19:21:56,953 - app.services.order_service - INFO - OrderService初始化完成 +2025-05-07 19:21:56,954 - app.services.order_service - INFO - OrderService开始处理指定Excel文件: D:/My Documents/python/orc-order-v2/data/output/微信图片_20250507191231.xlsx