|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
#include <stdio.h> |
|
|
#include <stdlib.h> |
|
|
#include <string.h> |
|
|
#include <windows.h> |
|
|
|
|
|
|
|
|
/*
 * Function-pointer types for the entry points that main() resolves from
 * oneocr.dll with GetProcAddress.  Handles are passed around as plain
 * long long values.  Every non-release call returns a long long status;
 * main() treats a non-zero status from pipeline creation and from the OCR
 * run as failure.  Parameter names mirror how main() calls each function.
 */

/* --- option objects and pipeline ------------------------------------- */
typedef long long (*fn_CreateOcrInitOptions)(long long *out_init_options);
typedef long long (*fn_OcrInitOptionsSetUseModelDelayLoad)(long long init_options,
                                                           char flag);
typedef long long (*fn_CreateOcrPipeline)(const char *model_path,
                                          const char *key,
                                          long long init_options,
                                          long long *out_pipeline);
typedef long long (*fn_CreateOcrProcessOptions)(long long *out_process_options);
typedef long long (*fn_OcrProcessOptionsSetMaxRecognitionLineCount)(
    long long process_options, long long max_line_count);

/* --- running OCR ------------------------------------------------------ */
typedef long long (*fn_RunOcrPipeline)(long long pipeline,
                                       void *image,
                                       long long process_options,
                                       long long *out_result);

/* --- reading a result ------------------------------------------------- */
typedef long long (*fn_GetImageAngle)(long long result, float *out_angle);
typedef long long (*fn_GetOcrLineCount)(long long result, long long *out_count);
typedef long long (*fn_GetOcrLine)(long long result, long long index,
                                   long long *out_line);
typedef long long (*fn_GetOcrLineContent)(long long line, const char **out_text);
typedef long long (*fn_GetOcrLineBoundingBox)(long long line, void **out_bbox);
typedef long long (*fn_GetOcrLineWordCount)(long long line, long long *out_count);
typedef long long (*fn_GetOcrWord)(long long line, long long index,
                                   long long *out_word);
typedef long long (*fn_GetOcrWordContent)(long long word, const char **out_text);
typedef long long (*fn_GetOcrWordBoundingBox)(long long word, void **out_bbox);
typedef long long (*fn_GetOcrWordConfidence)(long long word, float *out_confidence);

/* --- releasing handles ------------------------------------------------ */
typedef void (*fn_ReleaseOcrResult)(long long result);
typedef void (*fn_ReleaseOcrInitOptions)(long long init_options);
typedef void (*fn_ReleaseOcrPipeline)(long long pipeline);
typedef void (*fn_ReleaseOcrProcessOptions)(long long process_options);
|
|
|
|
|
/* Both structures are declared with 1-byte packing so that no padding is
 * inserted between their members. */
#pragma pack(push, 1)

/*
 * Image descriptor handed to RunOcrPipeline (as a void pointer).
 * main() fills it positionally, so the member order must not change.
 */
typedef struct {
    int type;             /* main() passes 3 together with a 4-byte-per-pixel buffer */
    int width;            /* image width in pixels */
    int height;           /* image height in pixels */
    int reserved;         /* main() passes 0 */
    long long step;       /* bytes per row; main() passes width * 4 */
    unsigned char *data;  /* pixel buffer */
} ImageStruct;

/*
 * Bounding box as returned by the line/word bounding-box getters:
 * eight floats, emitted by main() in the order x1,y1,x2,y2,x3,y3,x4,y4.
 * NOTE(review): presumably four corner points; the corner order is not
 * established in this file.
 */
typedef struct {
    float x1, y1;
    float x2, y2;
    float x3, y3;
    float x4, y4;
} BBox;

#pragma pack(pop)
|
|
|
|
|
|
|
|
/* Read an unsigned 16-bit little-endian value from p. */
static unsigned bmp_read_u16(const unsigned char* p) {
    return (unsigned)p[0] | ((unsigned)p[1] << 8);
}

/* Read an unsigned 32-bit little-endian value from p. */
static unsigned long bmp_read_u32(const unsigned char* p) {
    return (unsigned long)p[0] | ((unsigned long)p[1] << 8) |
           ((unsigned long)p[2] << 16) | ((unsigned long)p[3] << 24);
}

/* Read a signed 32-bit little-endian value from p, widened to long long. */
static long long bmp_read_i32(const unsigned char* p) {
    long long v = (long long)bmp_read_u32(p);
    if (v >= 0x80000000LL) v -= 0x100000000LL;
    return v;
}

/*
 * Load a 24- or 32-bit-per-pixel BMP file into a tightly packed, top-down
 * buffer of 4 bytes per pixel.
 *
 * 24-bit pixels are copied byte-for-byte into the first three bytes of each
 * output pixel and the fourth byte is set to 255; 32-bit pixels are copied
 * unchanged.  Bottom-up files (positive height) are flipped so that row 0 of
 * the result is the top of the image.
 *
 * path  file to read
 * w, h  receive the width and the (always positive) height in pixels;
 *       written only on success
 *
 * Returns a malloc'd buffer of (*w) * (*h) * 4 bytes that the caller must
 * free(), or NULL when the file cannot be opened, is not a BMP with a
 * BITMAPINFOHEADER-style header, has an unsupported bit depth or implausible
 * dimensions, is truncated, or memory cannot be allocated.
 */
static unsigned char* load_bmp_bgra(const char* path, int* w, int* h) {
    enum {
        BMP_HEADER_SIZE = 54,      /* 14-byte file header + 40-byte info header */
        BMP_INFO_HEADER_MIN = 40,  /* smallest header with 32-bit width/height */
        BMP_MAX_DIM = 1 << 24      /* keeps width * 4 well inside int range */
    };
    unsigned char header[BMP_HEADER_SIZE];
    unsigned char* bgra = NULL;
    unsigned char* row = NULL;
    FILE* f = NULL;
    long long width = 0;
    long long height = 0;
    unsigned long offset = 0;
    unsigned bpp = 0;
    size_t out_stride = 0;
    size_t src_stride = 0;
    size_t src_used = 0;
    int top_down = 0;
    int ok = 0;

    if (!path || !w || !h) return NULL;

    f = fopen(path, "rb");
    if (!f) return NULL;

    if (fread(header, 1, sizeof(header), f) != sizeof(header)) goto done;
    if (header[0] != 'B' || header[1] != 'M') goto done;
    if (bmp_read_u32(header + 14) < BMP_INFO_HEADER_MIN) goto done;

    /* Fields are assembled byte by byte: the header buffer is not aligned
     * for direct int/short loads. */
    offset = bmp_read_u32(header + 10);
    width = bmp_read_i32(header + 18);
    height = bmp_read_i32(header + 22);
    bpp = bmp_read_u16(header + 28);

    /* A negative height marks a top-down file. */
    if (height < 0) {
        top_down = 1;
        height = -height;
    }

    if (bpp != 24 && bpp != 32) goto done;
    if (width <= 0 || width > BMP_MAX_DIM) goto done;
    if (height <= 0 || height > BMP_MAX_DIM) goto done;
    if (offset < BMP_HEADER_SIZE || offset > 0x7FFFFFFFUL) goto done;
    if (fseek(f, (long)offset, SEEK_SET) != 0) goto done;

    out_stride = (size_t)width * 4;
    if ((size_t)height > (size_t)-1 / out_stride) goto done;
    bgra = (unsigned char*)malloc(out_stride * (size_t)height);
    if (!bgra) goto done;

    if (bpp == 24) {
        /* Source rows are padded to a multiple of four bytes. */
        src_used = (size_t)width * 3;
        src_stride = (src_used + 3) & ~(size_t)3;
        row = (unsigned char*)malloc(src_stride);
        if (!row) goto done;

        for (long long y = 0; y < height; y++) {
            long long dest_y = top_down ? y : (height - 1 - y);
            unsigned char* dst = bgra + (size_t)dest_y * out_stride;

            /* Tolerate a missing pad on the final row, but never missing pixels. */
            if (fread(row, 1, src_stride, f) < src_used) goto done;

            for (size_t x = 0; x < (size_t)width; x++) {
                dst[x * 4 + 0] = row[x * 3 + 0];
                dst[x * 4 + 1] = row[x * 3 + 1];
                dst[x * 4 + 2] = row[x * 3 + 2];
                dst[x * 4 + 3] = 255;
            }
        }
    } else {
        for (long long y = 0; y < height; y++) {
            long long dest_y = top_down ? y : (height - 1 - y);
            unsigned char* dst = bgra + (size_t)dest_y * out_stride;

            if (fread(dst, 1, out_stride, f) != out_stride) goto done;
        }
    }

    *w = (int)width;
    *h = (int)height;
    ok = 1;

done:
    free(row);
    fclose(f);
    if (!ok) {
        free(bgra);
        bgra = NULL;
    }
    return bgra;
}
|
|
|
|
|
|
|
|
/*
 * Write s into out as a double-quoted JSON string literal.
 *
 * Quotes and backslashes are backslash-escaped; newline, carriage return,
 * tab, backspace and form feed use their short escapes; every other byte
 * below 0x20 is written as \u00XX.  All remaining bytes are copied through
 * unchanged.
 *
 * s    NUL-terminated input; NULL is treated as an empty string
 * out  destination buffer
 * max  size of out in bytes
 *
 * The result is always NUL-terminated when max >= 1.  Input that does not
 * fit is cut off at the last character (or escape sequence) that fits
 * completely, and the closing quote is still written.  Truncation is
 * byte-wise, so it may split a multi-byte character.  When max is smaller
 * than 3 there is no room for even "" and out receives an empty C string.
 */
static void json_escape(const char* s, char* out, int max) {
    static const char hex_digits[] = "0123456789abcdef";
    int j = 0;

    if (!out || max <= 0) return;
    if (max < 3) {
        out[0] = 0;
        return;
    }
    if (!s) s = "";

    out[j++] = '"';
    for (int i = 0; s[i]; i++) {
        unsigned char c = (unsigned char)s[i];
        char short_esc = 0;
        int need;

        switch (c) {
        case '"':  short_esc = '"';  break;
        case '\\': short_esc = '\\'; break;
        case '\n': short_esc = 'n';  break;
        case '\r': short_esc = 'r';  break;
        case '\t': short_esc = 't';  break;
        case '\b': short_esc = 'b';  break;
        case '\f': short_esc = 'f';  break;
        default: break;
        }

        need = short_esc ? 2 : (c < 0x20 ? 6 : 1);

        /* Always keep two bytes free for the closing quote and the NUL. */
        if (j + need > max - 2) break;

        if (short_esc) {
            out[j++] = '\\';
            out[j++] = short_esc;
        } else if (c < 0x20) {
            out[j++] = '\\';
            out[j++] = 'u';
            out[j++] = '0';
            out[j++] = '0';
            out[j++] = hex_digits[c >> 4];
            out[j++] = hex_digits[c & 0x0F];
        } else {
            out[j++] = (char)c;
        }
    }
    out[j++] = '"';
    out[j] = 0;
}
|
|
|
|
|
int main(int argc, char** argv) { |
|
|
if (argc < 4) { |
|
|
fprintf(stderr, "Usage: %s <dll_dir> <image.bmp> <model_key_hex>\n", argv[0]); |
|
|
return 1; |
|
|
} |
|
|
|
|
|
const char* dll_dir = argv[1]; |
|
|
const char* img_path = argv[2]; |
|
|
const char* key_hex = argv[3]; |
|
|
|
|
|
|
|
|
SetDllDirectoryA(dll_dir); |
|
|
char old_path[32768]; |
|
|
GetEnvironmentVariableA("PATH", old_path, sizeof(old_path)); |
|
|
char new_path[32768]; |
|
|
snprintf(new_path, sizeof(new_path), "%s;%s", dll_dir, old_path); |
|
|
SetEnvironmentVariableA("PATH", new_path); |
|
|
|
|
|
|
|
|
char dll_path[MAX_PATH]; |
|
|
snprintf(dll_path, sizeof(dll_path), "%s\\oneocr.dll", dll_dir); |
|
|
|
|
|
HMODULE hmod = LoadLibraryA(dll_path); |
|
|
if (!hmod) { |
|
|
fprintf(stderr, "{\"error\": \"LoadLibrary failed: %lu\"}\n", GetLastError()); |
|
|
return 1; |
|
|
} |
|
|
|
|
|
|
|
|
#define GETFN(name) fn_##name p##name = (fn_##name)GetProcAddress(hmod, #name); \ |
|
|
if (!p##name) { fprintf(stderr, "{\"error\": \"GetProcAddress(%s) failed\"}\n", #name); return 1; } |
|
|
|
|
|
GETFN(CreateOcrInitOptions) |
|
|
GETFN(OcrInitOptionsSetUseModelDelayLoad) |
|
|
GETFN(CreateOcrPipeline) |
|
|
GETFN(CreateOcrProcessOptions) |
|
|
GETFN(OcrProcessOptionsSetMaxRecognitionLineCount) |
|
|
GETFN(RunOcrPipeline) |
|
|
GETFN(GetImageAngle) |
|
|
GETFN(GetOcrLineCount) |
|
|
GETFN(GetOcrLine) |
|
|
GETFN(GetOcrLineContent) |
|
|
GETFN(GetOcrLineBoundingBox) |
|
|
GETFN(GetOcrLineWordCount) |
|
|
GETFN(GetOcrWord) |
|
|
GETFN(GetOcrWordContent) |
|
|
GETFN(GetOcrWordBoundingBox) |
|
|
GETFN(GetOcrWordConfidence) |
|
|
GETFN(ReleaseOcrResult) |
|
|
GETFN(ReleaseOcrInitOptions) |
|
|
GETFN(ReleaseOcrPipeline) |
|
|
GETFN(ReleaseOcrProcessOptions) |
|
|
|
|
|
|
|
|
char model_path[MAX_PATH]; |
|
|
snprintf(model_path, sizeof(model_path), "%s\\oneocr.onemodel", dll_dir); |
|
|
|
|
|
|
|
|
int key_len = strlen(key_hex) / 2; |
|
|
char key[64]; |
|
|
for (int i = 0; i < key_len && i < 63; i++) { |
|
|
sscanf(key_hex + i*2, "%2hhx", &key[i]); |
|
|
} |
|
|
key[key_len] = 0; |
|
|
|
|
|
|
|
|
long long init_opts = 0; |
|
|
pCreateOcrInitOptions(&init_opts); |
|
|
|
|
|
long long pipeline = 0; |
|
|
long long res = pCreateOcrPipeline(model_path, key, init_opts, &pipeline); |
|
|
if (res != 0) { |
|
|
fprintf(stderr, "{\"error\": \"CreateOcrPipeline failed: %lld\"}\n", res); |
|
|
return 1; |
|
|
} |
|
|
|
|
|
long long proc_opts = 0; |
|
|
pCreateOcrProcessOptions(&proc_opts); |
|
|
pOcrProcessOptionsSetMaxRecognitionLineCount(proc_opts, 200); |
|
|
|
|
|
|
|
|
int w = 0, h = 0; |
|
|
unsigned char* data = load_bmp_bgra(img_path, &w, &h); |
|
|
if (!data) { |
|
|
fprintf(stderr, "{\"error\": \"Failed to load image\"}\n"); |
|
|
return 1; |
|
|
} |
|
|
|
|
|
ImageStruct img = {3, w, h, 0, (long long)(w * 4), data}; |
|
|
|
|
|
|
|
|
long long result = 0; |
|
|
res = pRunOcrPipeline(pipeline, &img, proc_opts, &result); |
|
|
if (res != 0) { |
|
|
fprintf(stderr, "{\"error\": \"RunOcrPipeline failed: %lld\"}\n", res); |
|
|
return 1; |
|
|
} |
|
|
|
|
|
|
|
|
float angle = 0; |
|
|
pGetImageAngle(result, &angle); |
|
|
|
|
|
long long line_count = 0; |
|
|
pGetOcrLineCount(result, &line_count); |
|
|
|
|
|
|
|
|
char buf[65536]; |
|
|
int pos = 0; |
|
|
pos += snprintf(buf + pos, sizeof(buf) - pos, |
|
|
"{\"text_angle\": %.4f, \"lines\": [", angle); |
|
|
|
|
|
for (long long i = 0; i < line_count; i++) { |
|
|
long long line = 0; |
|
|
pGetOcrLine(result, i, &line); |
|
|
|
|
|
const char* line_text = NULL; |
|
|
pGetOcrLineContent(line, &line_text); |
|
|
|
|
|
BBox* line_bbox = NULL; |
|
|
pGetOcrLineBoundingBox(line, (void**)&line_bbox); |
|
|
|
|
|
long long word_count = 0; |
|
|
pGetOcrLineWordCount(line, &word_count); |
|
|
|
|
|
if (i > 0) pos += snprintf(buf + pos, sizeof(buf) - pos, ", "); |
|
|
|
|
|
char esc_line[4096]; |
|
|
json_escape(line_text ? line_text : "", esc_line, sizeof(esc_line)); |
|
|
|
|
|
pos += snprintf(buf + pos, sizeof(buf) - pos, |
|
|
"{\"text\": %s, \"bbox\": [%.1f,%.1f,%.1f,%.1f,%.1f,%.1f,%.1f,%.1f], \"words\": [", |
|
|
esc_line, |
|
|
line_bbox ? line_bbox->x1 : 0, line_bbox ? line_bbox->y1 : 0, |
|
|
line_bbox ? line_bbox->x2 : 0, line_bbox ? line_bbox->y2 : 0, |
|
|
line_bbox ? line_bbox->x3 : 0, line_bbox ? line_bbox->y3 : 0, |
|
|
line_bbox ? line_bbox->x4 : 0, line_bbox ? line_bbox->y4 : 0); |
|
|
|
|
|
for (long long j = 0; j < word_count; j++) { |
|
|
long long word = 0; |
|
|
pGetOcrWord(line, j, &word); |
|
|
|
|
|
const char* word_text = NULL; |
|
|
pGetOcrWordContent(word, &word_text); |
|
|
|
|
|
BBox* word_bbox = NULL; |
|
|
pGetOcrWordBoundingBox(word, (void**)&word_bbox); |
|
|
|
|
|
float word_conf = 0; |
|
|
pGetOcrWordConfidence(word, &word_conf); |
|
|
|
|
|
if (j > 0) pos += snprintf(buf + pos, sizeof(buf) - pos, ", "); |
|
|
|
|
|
char esc_word[2048]; |
|
|
json_escape(word_text ? word_text : "", esc_word, sizeof(esc_word)); |
|
|
|
|
|
pos += snprintf(buf + pos, sizeof(buf) - pos, |
|
|
"{\"text\": %s, \"confidence\": %.4f, \"bbox\": [%.1f,%.1f,%.1f,%.1f,%.1f,%.1f,%.1f,%.1f]}", |
|
|
esc_word, word_conf, |
|
|
word_bbox ? word_bbox->x1 : 0, word_bbox ? word_bbox->y1 : 0, |
|
|
word_bbox ? word_bbox->x2 : 0, word_bbox ? word_bbox->y2 : 0, |
|
|
word_bbox ? word_bbox->x3 : 0, word_bbox ? word_bbox->y3 : 0, |
|
|
word_bbox ? word_bbox->x4 : 0, word_bbox ? word_bbox->y4 : 0); |
|
|
} |
|
|
|
|
|
pos += snprintf(buf + pos, sizeof(buf) - pos, "]}"); |
|
|
} |
|
|
|
|
|
pos += snprintf(buf + pos, sizeof(buf) - pos, "]}"); |
|
|
|
|
|
|
|
|
printf("%s\n", buf); |
|
|
fflush(stdout); |
|
|
|
|
|
|
|
|
pReleaseOcrResult(result); |
|
|
free(data); |
|
|
pReleaseOcrProcessOptions(proc_opts); |
|
|
pReleaseOcrPipeline(pipeline); |
|
|
pReleaseOcrInitOptions(init_opts); |
|
|
FreeLibrary(hmod); |
|
|
|
|
|
return 0; |
|
|
} |
|
|
|