RhSolutions-AddIn/RhSolutions.AddIn/Services/YandexOcrClient.cs

70 lines
2.1 KiB
C#
Raw Normal View History

2024-11-13 23:42:28 +03:00
using System.Net.Http;
using System.Net.Http.Headers;
using System.Text;
2024-11-14 00:16:58 +03:00
using System.Threading.Tasks;
2024-11-13 23:42:28 +03:00
using Newtonsoft.Json;
2024-11-14 00:16:58 +03:00
namespace RhSolutions.Services;
2024-11-13 23:42:28 +03:00
public class YandexOcrClient : IOcrClient
{
private readonly HttpClient _httpClient;
public YandexOcrClient(HttpClient httpClient)
{
_httpClient = httpClient;
_httpClient.BaseAddress = new Uri("https://ocr.api.cloud.yandex.net/ocr/v1/");
}
public async Task<IEnumerable<object[,]>> ProcessImage(string base64Image, string xFolderId, string apiKey)
{
using StringContent jsonContent = new(
JsonConvert.SerializeObject(new
{
mimeType = "PNG",
languageCodes = new string[] { "ru", "en" },
model = "table",
content = base64Image
}),
Encoding.UTF8,
"application/json");
_httpClient.DefaultRequestHeaders.Authorization = new AuthenticationHeaderValue("Api-Key", apiKey);
_httpClient.DefaultRequestHeaders.Add("x-folder-id", xFolderId);
_httpClient.DefaultRequestHeaders.Add("x-data-logging-enable", "true");
using HttpResponseMessage response = await _httpClient.PostAsync("recognizeText", jsonContent);
response.EnsureSuccessStatusCode();
string jsonResponse = await response.Content.ReadAsStringAsync();
2024-11-14 00:16:58 +03:00
OcrResponse deserialized = JsonConvert.DeserializeObject<OcrResponse>(jsonResponse);
2024-11-13 23:42:28 +03:00
if (deserialized != null)
{
var tables = deserialized?.Result?.TextAnnotation?.Tables ?? Enumerable.Empty<Table>();
if (tables.Any())
{
List<object[,]> result = new();
foreach (var table in tables)
{
if (table.Cells == null || table.Cells.Count == 0)
{
continue;
}
int columnCount = int.Parse(table.ColumnCount);
int rowCount = int.Parse(table.RowCount);
object[,] cells = new object[rowCount, columnCount];
foreach (Cell cell in table.Cells)
{
int rowIndex = int.Parse(cell.RowIndex);
int columnIndex = int.Parse(cell.ColumnIndex);
cells[rowIndex, columnIndex] = double.TryParse(cell.Text, out double v) ?
v : cell.Text ?? string.Empty;
}
result.Add(cells);
}
return result;
}
}
2024-11-13 23:43:27 +03:00
return Enumerable.Empty<object[,]>();
2024-11-13 23:42:28 +03:00
}
}