Browse Source

ocr接口文档下载

leiy 9 months ago
parent
commit
599f704ef2

+ 176 - 15
OASystem/OASystem.Api/Controllers/TencentOCRController.cs

@@ -1,15 +1,22 @@
 using Aspose.Cells;
+using Aspose.Words;
+using Microsoft.AspNetCore.Mvc.ViewEngines;
+using NPOI.HPSF;
 using OASystem.API.OAMethodLib.File;
 //using OASystem.API.OAMethodLib.NPOI;
 using OASystem.API.OAMethodLib.TencentCloudAPI;
 using OASystem.API.OAMethodLib.YouDaoAPI;
 using OASystem.Domain.Dtos.CRM;
+using OASystem.Domain.Dtos.QiYeWeChat;
 using OASystem.Domain.Dtos.Tencent;
+using OASystem.Domain.ViewModels.OCR;
 using OASystem.Domain.ViewModels.TencentOCR;
 using OASystem.Infrastructure.Repositories.CRM;
 using Org.BouncyCastle.Crypto;
 using Org.BouncyCastle.Utilities.Encoders;
 using StackExchange.Redis;
+using System.Collections.Generic;
+using System.Data;
 using System.Net.NetworkInformation;
 using TencentCloud.Ocr.V20181119.Models;
 using Ubiety.Dns.Core;
@@ -34,6 +41,7 @@ namespace OASystem.API.Controllers
 
         /// <summary>
         /// 通用印刷体
+        /// 文档下载
         /// </summary>
         /// <param name="dto"></param>
         /// <returns></returns>
@@ -54,7 +62,7 @@ namespace OASystem.API.Controllers
                 return Ok(JsonView("图片不能大于7M!"));
             }
 
-            var gbData =  TencentOCRTools.GetOCR((int)TencentOCREnum.GeneralBasic, dto);
+            var gbData = await TencentOCRTools.GetOCR((int)TencentOCREnum.GeneralBasic, dto);
 
             if (gbData.Code != 0)
             {
@@ -66,13 +74,42 @@ namespace OASystem.API.Controllers
                 return Ok(JsonView(gbData.Msg));
             }
 
-            return Ok(JsonView(gbData.Data));
+            #region word下载
+
+            GeneralBasicOCRResponse res = gbData.Data as GeneralBasicOCRResponse;
+
+            Document doc = new Document();
+            DocumentBuilder builder = new DocumentBuilder(doc);
+            string fileName = "通用印刷体";
+            string content = $"{fileName}\r\n\r\n";
+            foreach (var view in res.TextDetections)
+            {
+                content += $"Content:{view.DetectedText}\r\n\r\n";
+            }
+
+            builder.Write(content);
+
+            string outputDir = $"{AppSettingsHelper.Get("WordBasePath")}/TencentOCR";
+            string outputFile = $"{fileName}{DateTime.Now.ToString("yyyyMMddHHmmss")}.docx";
+            string outputPath = Path.Combine(outputDir, outputFile);
+
+            if (!Directory.Exists(outputDir))
+            {
+                Directory.CreateDirectory(outputDir);
+            }
+
+            doc.Save(outputPath);
+            string url = $"{AppSettingsHelper.Get("WordBaseUrl")}Office/Word/TencentOCR/{outputFile}";
+
+            #endregion
+
+            return Ok(JsonView(true, "操作成功", new { dataSource = res, url = url }));
         }
 
 
         /// <summary>
         /// 身份证识别(国徽面/反面)
-        /// 获取身份证返回数据
+        /// 文档下载
         /// </summary>
         /// <param name="dto"></param>
         /// <returns></returns>
@@ -93,7 +130,7 @@ namespace OASystem.API.Controllers
                 return Ok(JsonView("图片不能大于7M!"));
             }
 
-            var idCardData = TencentOCRTools.GetOCR((int)TencentOCREnum.IDCard, dto);
+            var idCardData =await TencentOCRTools.GetOCR((int)TencentOCREnum.IDCard, dto);
 
             if (idCardData.Code != 0)
             {
@@ -174,7 +211,7 @@ namespace OASystem.API.Controllers
 
         /// <summary>
         /// 户口簿识别
-        /// 获取户口簿返回数据 
+        ///  文档下载 
         /// </summary>
         /// <param name="dto"></param>
         /// <returns></returns>
@@ -188,7 +225,7 @@ namespace OASystem.API.Controllers
                 return Ok(JsonView("图片不能大于7M!"));
             }
 
-            var residenceBookData = TencentOCRTools.GetOCR((int)TencentOCREnum.ResidenceBooklet, dto);
+            var residenceBookData = await TencentOCRTools.GetOCR((int)TencentOCREnum.ResidenceBooklet, dto);
 
             if (residenceBookData.Code != 0)
             {
@@ -200,6 +237,51 @@ namespace OASystem.API.Controllers
                 return Ok(JsonView(residenceBookData.Msg));
             }
 
+            #region Feil Down
+
+            BizLicenseOCRResponse res = residenceBookData.Data as BizLicenseOCRResponse;
+
+            Document doc = new Document();
+            DocumentBuilder builder = new DocumentBuilder(doc);
+
+            string fileName = "户口簿识别";
+            string content = $"{fileName}\r\n\r\n";
+
+            if (res != null)
+            {
+                content += $"公司名称:{res.Name}\r\n\r\n";
+                content += $"统一社会信用代码(三合一之前为注册号):{res.RegNum}\r\n\r\n";
+                content += $"注册资本:{res.Capital}\r\n\r\n";
+                content += $"法人代表:{res.Person}\r\n\r\n";
+                content += $"地址:{res.Address}\r\n\r\n";
+                content += $"经营范围:{res.Business}\r\n\r\n";
+                content += $"主题类型:{res.Type}\r\n\r\n";
+                content += $"营业期限:{res.Period}\r\n\r\n";
+                content += $"组成形式:{res.ComposingForm}\r\n\r\n";
+                content += $"成立日期:{res.SetDate}\r\n\r\n";
+            }
+
+            
+
+            builder.Write(content);
+
+            string outputDir = $"{AppSettingsHelper.Get("WordBasePath")}/TencentOCR";
+            string outputFile = $"{fileName}{DateTime.Now.ToString("yyyyMMddHHmmss")}.docx";
+            string outputPath = Path.Combine(outputDir, outputFile);
+
+            if (!Directory.Exists(outputDir))
+            {
+                Directory.CreateDirectory(outputDir);
+            }
+
+            doc.Save(outputPath);
+
+
+
+            return $"{AppSettingsHelper.Get("WordBaseUrl")}Office/Word/TencentOCR/{outputFile}";
+
+            #endregion
+
 
             return Ok(JsonView(residenceBookData.Data));
         }
@@ -220,7 +302,7 @@ namespace OASystem.API.Controllers
                 return Ok(JsonView("图片不能大于7M!"));
             }
 
-            var residenceBookData = TencentOCRTools.GetOCR((int)TencentOCREnum.BizLicense, dto);
+            var residenceBookData = await TencentOCRTools.GetOCR((int)TencentOCREnum.BizLicense, dto);
 
             if (residenceBookData.Code != 0)
             {
@@ -252,7 +334,7 @@ namespace OASystem.API.Controllers
                 return Ok(JsonView("图片不能大于7M!"));
             }
 
-            var occData = TencentOCRTools.GetOCR((int)TencentOCREnum.OrgCodeCert, dto);
+            var occData = await TencentOCRTools.GetOCR((int)TencentOCREnum.OrgCodeCert, dto);
 
             if (occData.Code != 0)
             {
@@ -284,7 +366,7 @@ namespace OASystem.API.Controllers
                 return Ok(JsonView("图片不能大于7M!"));
             }
 
-            var vehicleLicenseData = TencentOCRTools.GetOCR((int)TencentOCREnum.VehicleLicense, dto);
+            var vehicleLicenseData = await TencentOCRTools.GetOCR((int)TencentOCREnum.VehicleLicense, dto);
 
             if (vehicleLicenseData.Code != 0)
             {
@@ -315,7 +397,7 @@ namespace OASystem.API.Controllers
                 return Ok(JsonView("图片不能大于7M!"));
             }
 
-            var pcData = TencentOCRTools.GetOCR((int)TencentOCREnum.PropOwnerCert, dto);
+            var pcData = await TencentOCRTools.GetOCR((int)TencentOCREnum.PropOwnerCert, dto);
 
             if (pcData.Code != 0)
             {
@@ -346,7 +428,7 @@ namespace OASystem.API.Controllers
                 return Ok(JsonView("图片不能大于7M!"));
             }
 
-            var mlData = TencentOCRTools.GetOCR((int)TencentOCREnum.GeneralBasic, dto);
+            var mlData = await TencentOCRTools.GetOCR((int)TencentOCREnum.GeneralBasic, dto);
 
             if (mlData.Code != 0)
             {
@@ -377,7 +459,7 @@ namespace OASystem.API.Controllers
                 return Ok(JsonView("图片不能大于7M!"));
             }
 
-            var gbData = TencentOCRTools.GetOCR((int)TencentOCREnum.GeneralBasic, dto);
+            var gbData = await TencentOCRTools.GetOCR((int)TencentOCREnum.GeneralBasic, dto);
 
             if (gbData.Code != 0)
             {
@@ -408,7 +490,7 @@ namespace OASystem.API.Controllers
                 return Ok(JsonView("图片不能大于7M!"));
             }
 
-            var pData = TencentOCRTools.GetOCR((int)TencentOCREnum.Passport, dto);
+            var pData = await TencentOCRTools.GetOCR((int)TencentOCREnum.Passport, dto);
 
             if (pData.Code != 0)
             {
@@ -439,7 +521,7 @@ namespace OASystem.API.Controllers
                 return Ok(JsonView("图片不能大于7M!"));
             }
 
-            var mlidpData = TencentOCRTools.GetOCR((int)TencentOCREnum.MLIDPassport, dto);
+            var mlidpData = await TencentOCRTools.GetOCR((int)TencentOCREnum.MLIDPassport, dto);
 
             if (mlidpData.Code != 0)
             {
@@ -472,7 +554,7 @@ namespace OASystem.API.Controllers
 
             try
             {
-                var mlidpData = TencentOCRTools.GetOCR((int)TencentOCREnum.BusinessCard, dto);
+                var mlidpData = await TencentOCRTools.GetOCR((int)TencentOCREnum.BusinessCard, dto);
                 if (mlidpData.Code != 0)
                 {
                     return Ok(JsonView(mlidpData.Msg));
@@ -491,6 +573,85 @@ namespace OASystem.API.Controllers
             }
         }
 
+        /// <summary>
+        /// 智能结构化识别V2
+        /// 获取名片 返回数据 
+        /// </summary>
+        /// <param name="dto"></param>
+        /// <returns></returns>
+        [HttpPost]
+        [ProducesResponseType(typeof(JsonView), StatusCodes.Status200OK)]
+        public async Task<IActionResult> GetSmartStructuralOCRV2(BusinessCardOCRDto dto)
+        {
+            string[] picBase64Array = dto.picBase64.Split(';');
+            string picFormat = picBase64Array[0].Split('/')[1];
+            if (!TencentOCRTools.ImageType(picFormat))
+            {
+                return Ok(JsonView("图片格式不正确!只支持 PNG、JPG、JPEG、BMP 格式!"));
+            }
+
+            double strSize = 1024 * 1024 * 7;
+            if (dto.picBase64.Length > strSize)
+            {
+                return Ok(JsonView("图片不能大于7M!"));
+            }
+
+           
+            var ssData = await TencentOCRTools.GetOCR((int)TencentOCREnum.SmartStructuralOCRV2, dto);
+            if (ssData.Code != 0)
+            {
+                return Ok(JsonView(false, ssData.Msg));
+            }
+
+            if (ssData.Data == null)
+            {
+                return Ok(JsonView(false, ssData.Msg));
+            }
+
+            //var wordRes =  GenerateWord(ssData.Data as List<ocrGeneralView>, "智能结构化识别V2");
+            List<ocrGeneralView>? datas = ssData.Data as List<ocrGeneralView>;
+
+            var data = new { 
+                dataSource = ssData.Data,
+                url = GenerateWord(datas, "智能结构化识别V2")
+            };
+            return Ok(JsonView(true, ssData.Msg, data));
+           
+        }
+
+
+        /// <summary>
+        /// 生成 ocr word
+        /// </summary>
+        /// <param name="views"></param>
+        /// <param name="fileName"></param>
+        /// <returns></returns>
+        private string GenerateWord(List<ocrGeneralView> views, string fileName)
+        {
+            Document doc = new Document();
+            DocumentBuilder builder = new DocumentBuilder(doc);
+
+            string content = $"{fileName}\r\n\r\n";
+            foreach (var view in views)
+            {
+                content += $"TypeName:{view.name}\t\r\nContent:{view.value}\r\n\r\n";
+            }
+
+            builder.Write(content);
+
+            string outputDir = $"{AppSettingsHelper.Get("WordBasePath")}/TencentOCR";
+            string outputFile = $"{fileName}{DateTime.Now.ToString("yyyyMMddHHmmss")}.docx";
+            string outputPath = Path.Combine(outputDir, outputFile);
+
+            if (!Directory.Exists(outputDir))
+            {
+                Directory.CreateDirectory(outputDir);
+            }
+
+            doc.Save(outputPath);
+
+            return $"{AppSettingsHelper.Get("WordBaseUrl")}Office/Word/TencentOCR/{outputFile}";
+        }
         #endregion
 
         #region android ios

+ 7 - 0
OASystem/OASystem.Api/OAMethodLib/File/AsposeHelper.cs

@@ -43,6 +43,13 @@ namespace OASystem.API.OAMethodLib.File
                 }
 
                 string tempPath = string.Format("{0}/Word/Template/{1}", AppSettingsHelper.Get("OfficeTempBasePath"), tempFileName);
+
+                //// 将文本编码为字节序列
+                //byte[] encodedBytes = Encoding.UTF8.GetBytes(tempPath);
+
+                //// 解码字节序列为文本
+                //tempPath = Encoding.UTF8.GetString(encodedBytes);
+                
                 //载入模板
                 Document doc = new Document(tempPath);
                 doc.MailMerge.Execute(fieldNames.ToArray(), fieldValues.ToArray());

+ 25 - 1
OASystem/OASystem.Api/OAMethodLib/TencentCloudAPI/TencentOCRTools.cs

@@ -3,6 +3,8 @@ using TencentCloud.Common;
 using TencentCloud.Ocr.V20181119.Models;
 using TencentCloud.Ocr.V20181119;
 using OASystem.Domain.ViewModels.OCR;
+using Aspose.Words;
+using NPOI.SS.Formula.Functions;
 
 namespace OASystem.API.OAMethodLib.TencentCloudAPI
 {
@@ -26,7 +28,7 @@ namespace OASystem.API.OAMethodLib.TencentCloudAPI
         /// <param name="ocrEnum">转换类型</param>
         /// <param name="data">请求数据源</param>
         /// <returns></returns>
-        public static Result GetOCR(int ocrEnum, object data)
+        public static async Task<Result> GetOCR(int ocrEnum, object data)
         {
             Result result = new Result { Code = -1, Msg = "未知错误", Data = null };
             OcrClient client = new OcrClient(cred, "ap-guangzhou");
@@ -117,6 +119,25 @@ namespace OASystem.API.OAMethodLib.TencentCloudAPI
                         BusinessCardOCRResponse bcRep = client.BusinessCardOCRSync(bcReq);
                         result.Data = bcRep;
                         break;
+                    case 10: // 智能结构化识别V2
+                        //SmartStructuralOCRV2
+                        BusinessCardOCRDto ssOCR = (BusinessCardOCRDto)data;
+                        SmartStructuralOCRRequest ssReq = new SmartStructuralOCRRequest()
+                        {
+                            ImageBase64 = ssOCR.picBase64,
+                            IsPdf = true,
+                            ReturnFullText = true
+                        };
+
+                        SmartStructuralOCRResponse ssRep = client.SmartStructuralOCRSync(ssReq);
+                         List<StructuralItem> structuralItems = ssRep.StructuralItems.ToList();
+                        if (structuralItems.Count() < 1 )
+                        {
+                            return new Result() { Code = -1, Msg = "智能结构化识别V2:未识别出可用信息" };
+                        }
+                        List<ocrGeneralView> _views = structuralItems.Select(it => new ocrGeneralView() { name = it.Name, value = it.Value }).ToList();
+                        result.Data = _views;
+                        break;
                 }
 
                 result.Code = 0;
@@ -298,5 +319,8 @@ namespace OASystem.API.OAMethodLib.TencentCloudAPI
                 return Math.Round(size / TBCount, roundCount) + "TB";
             }
         }
+
+        
+
     }
 }

+ 5 - 1
OASystem/OASystem.Domain/Enums/TencentOCREnum.cs

@@ -61,6 +61,10 @@ namespace OASystem.Domain.Enums
         /// <summary>
         /// 名片识别
         /// </summary>
-        BusinessCard
+        BusinessCard,
+        /// <summary>
+        /// 智能结构化识别V2
+        /// </summary>
+        SmartStructuralOCRV2
     }
 }

+ 18 - 0
OASystem/OASystem.Domain/ViewModels/OCR/OCRAppView.cs

@@ -48,4 +48,22 @@ namespace OASystem.Domain.ViewModels.OCR
 
     }
 
+    /// <summary>
+    /// ocr 通用视图
+    /// </summary>
+    public class ocrGeneralView
+    {
+        /// <summary>
+        /// 类型名称
+        /// </summary>
+        public string name { get; set; }
+
+        /// <summary>
+        /// 类型值
+        /// </summary>
+        public string value { get; set; }
+
+
+    }
+
 }