aardio 文档

aardio 范例: 免费 OCR API(ocr.space)

相关范例 - 简单 OCR | 接口文档

//免费 OCR API(ocr.space)
//相关范例 - 简单 OCR: https://www.aardio.com/zh-cn/doc/example/Automation/ComputerVision/soImage.ocr.example.html

import win.ui;
import win.dlg.message;
import fonts.fontAwesome;
/*DSG{{*/
var winform = win.form(text="OCR 识别 - 自动导入剪贴板图像";right=1169;bottom=573)
winform.add(
bkplus={cls="bkplus";left=-17;top=516;right=1170;bottom=575;bgcolor=0xD2D2D2;db=1;dl=1;dr=1;z=1};
btnOcr={cls="plus";text="识别文本";left=843;top=533;right=940;bottom=563;align="left";color=0x3C3C3C;db=1;dr=1;font=LOGFONT(h=-13);iconStyle={align="left";font=LOGFONT(h=-13;name='FontAwesome');padding={left=8}};iconText='\uF0F6';notify=1;textPadding={left=25};z=6};
btnOpen={cls="plus";text="打开图像文件";left=366;top=532;right=499;bottom=562;align="left";color=0x3C3C3C;db=1;dl=1;font=LOGFONT(h=-13);iconStyle={align="left";font=LOGFONT(h=-13;name='FontAwesome');padding={left=8}};iconText='\uF03E';notify=1;textPadding={left=25};z=4};
btnPaste={cls="plus";text="粘粘自剪贴板";left=233;top=532;right=352;bottom=562;align="left";color=0x3C3C3C;db=1;dl=1;font=LOGFONT(h=-13);iconStyle={align="left";font=LOGFONT(h=-13;name='FontAwesome');padding={left=8}};iconText='\uF0EA';notify=1;textPadding={left=25};z=5};
btnScreenClip={cls="plus";text="截屏";left=149;top=532;right=219;bottom=562;align="left";color=0x3C3C3C;db=1;dl=1;font=LOGFONT(h=-13);iconStyle={align="left";font=LOGFONT(h=-13;name='FontAwesome');padding={left=8}};iconText='\uF030';notify=1;textPadding={left=25};z=10};
comboLanguage={cls="combobox";left=686;top=537;right=824;bottom=563;db=1;dr=1;edge=1;items={};mode="dropdown";vscroll=1;z=8};
edit={cls="richedit";left=589;top=0;right=1168;bottom=515;autohscroll=false;aw=1;db=1;dr=1;dt=1;edge=1;link=1;multiline=1;vscroll=1;z=3};
lbLanguage={cls="static";text="语言:";left=612;top=532;right=675;bottom=562;align="right";center=1;db=1;dr=1;transparent=1;z=9};
lnkOptimize={cls="plus";text="AI 优化";left=961;top=533;right=1048;bottom=563;align="left";color=0x3498DB;db=1;disabled=1;dr=1;font=LOGFONT(h=-14);iconStyle={align="left";font=LOGFONT(h=-13;name='FontAwesome')};iconText='\uF0D0 ';notify=1;textPadding={left=18};z=11};
lnkTranslate={cls="plus";text="AI 翻译";left=1063;top=533;right=1150;bottom=563;align="left";color=0x3498DB;db=1;disabled=1;dr=1;font=LOGFONT(h=-14);iconStyle={align="left";font=LOGFONT(h=-13;name='FontAwesome')};iconText='\uF0DB';notify=1;textPadding={left=18};z=12};
picturebox={cls="plus";text="请复制图像到剪贴板 / 或拖放文件到此处";left=0;top=0;right=584;bottom=515;aw=1;bgcolor=0xFFFFFF;color=0x999999;db=1;dl=1;dt=1;edge=1;font=LOGFONT(h=-16);iconStyle={font=LOGFONT(h=-60;name='FontAwesome')};iconText='\uF03E';repeat="scale";textPadding={top=100};z=2};
splitter={cls="splitter";left=583;top=0;right=588;bottom=515;bgcolor=0xFFFFFF;db=1;dt=1;frame=1;z=7}
)
/*}}*/

var ocr = function(winform,dataUrl){

    import web.rest.jsonLiteClient;
    var http = web.rest.jsonLiteClient();  

    // 此 API key 仅临时有效,稍后删除。
    var keyIndex = time().addDays(0).dayofyear%2 + 1;
    http.setHeaders( apikey = (["K83647549188957","K86141664788957"])[keyIndex] );
    /*
    自己申请一个永久免费 API key 非常简单 。

    1. 打开 https://mail.tm/zh/ 复制临时邮箱地址
    2. 打开 https://ocr.space/ocrapi/freekey 注册并输入上面的邮箱地址
    3. 回到 mail.tm 点刷新,点击确认邮件中的 “Yes, subscribe me to the free OCR API list.”
    4. 再次刷新并查收新邮件收到的  OCR API key 
    */

    // 接口文档: https://ocr.space/OCRAPI
    var ocrApi = http.api("https://api.ocr.space/");

    var langId = string.match(winform.comboLanguage.selText,"\s+(\w+)$");

    var result,err = ocrApi.parse.image({
        base64Image = dataUrl;
        language = langId; 
        OCREngine = 2;    // 引擎 2 对中文和特殊字符支持更好
        isTable = true;   // 表格或收据,这里只能指定为 true 否则报参数错。
    })

    if(result){
        // 检查 OCR 退出状态码 (1 为成功,2 为部分成功)
        if( result.OCRExitCode == 1 || result.OCRExitCode == 2 ){
            var parsedResults = result.ParsedResults;
            if(#parsedResults){ 
                var text  = table.map(parsedResults,lambda(v,k) v.ParsedText ) 
                winform.edit.text = string.join(text,'\n\n'); 
                winform.lnkTranslate.disabled = false;
                winform.lnkOptimize.disabled = false;
            } 
        }
        else {
             winform.edit.print(result.ErrorMessage || result.ErrorDetails || "OCR 失败");
        }
    } 
    else{
        if(err==`"The API key is invalid"`){
            winform.edit.text = "请到 https://ocr.space/ocrapi/freekey 输入邮箱并领取免费 key"
        }
        else  winform.edit.text = err||"未知错误"
    }

    winform.btnOcr.disabledText = null; 
    winform.picturebox.disabledText = null; 
}

winform.btnOcr.oncommand = function(id,event){
    if(winform.picturebox.backgroundBitmap){ 
        winform.edit.text = "识别中 ..."
        winform.btnOcr.disabledText = ['\uF254','\uF251','\uF252','\uF253','\uF250',text='识别中 ...']

        import inet.urlData;
        thread.invoke(ocr,winform,inet.urlData.fromBitmap(winform.picturebox.backgroundBitmap));
    }
    else {
        winform.msgErr("请先复制图像到剪贴板 / 或打开图像文件")
    } 
}

import fsys.dlg;
winform.btnOpen.oncommand = function(id,event){
    var path = fsys.dlg.open("图像文件|*.jpg;*.jpeg;*.jfif;*.bmp;*.gif;*.png;*.tif;*.tiff;*.webp||",,,winform)
    if(path){
        if(string.endsWith(path,".webp",true)){
            import gdip.webp;
        }
        winform.picturebox.background = path; 
        winform.picturebox.backgroundBitmap = gdip.bitmap(path);
        winform.picturebox.text = null;
        winform.picturebox.iconText = null;
    }
}

winform.lnkTranslate.oncommand = function(id,event){
    var text = string.trim(winform.edit.text);
    if(#text){
        import web.edgeTextToSpeech.translate; 
        var transForm = web.edgeTextToSpeech.translate(,text) 
        transForm.text = "OCRAPI 中英翻译 - 此页面支持英文划词速查";
        transForm.doModal();
    } 
    else {
        winform.msgErr("识别结果为空")
    } 
}

winform.onDropFiles = function(files){
    var path = files[1]
    if(path){
        if(string.endsWith(path,".webp",true)){
            import gdip.webp;
        }

        winform.picturebox.backgroundBitmap = gdip.bitmap(path);
        if(winform.picturebox.backgroundBitmap){
            winform.picturebox.background = path; 
        } 
    }
}

import win.clip.bitmap;
winform.btnPaste.oncommand = function(id,event){
    var bmp = win.clip.bitmap.read()
    if(bmp){ 
        winform.picturebox.backgroundBitmap = bmp;
        winform.picturebox.background = bmp;
        winform.picturebox.text = null;
        winform.picturebox.iconText = null;
    }
}

import win.clip.viewer;
winform.clipViewer = win.clip.viewer(winform);
winform.clipViewer.onDrawClipboard = function(){ 
    if(winform.screenclip){ 
        win.showForeground(winform.hwnd);
        winform.screenclip = false
    }
    winform.btnPaste.oncommand();
}
winform.btnPaste.oncommand()

winform.btnScreenClip.oncommand = function(id,event){
    winform.show(6/*_SW_MINIMIZE*/);
    winform.screenclip = true;

    import win.clip.screen;
    win.clip.screen();
}

winform.onActivate = function(state,hwndOther,minimized){
    if(state){
        winform.screenclip = false;     
    }
} 

winform.edit.enablePopMenu()

winform.splitter.split(winform.picturebox,winform.edit);

// 定义一个统一的按钮皮肤样式
var btnSkin = {
    color = {
        default = 0xFF3C3C3C; // 默认深灰色文本
        hover = 0xFF0078D4;   // 鼠标悬停变蓝色
        active = 0xFF005A9E;  // 鼠标按下变深蓝色
        disabled = 0xFFAAAAAA; // 禁用状态灰色
    };
    background = {
        hover = 0x1A0078D4;   // 悬停时淡淡的背景色
        active = 0x330078D4;  // 按下时稍深的背景色
    }
}

// 批量为所有按钮应用样式
for i,ctrl in [
    winform.btnPaste,
    winform.btnOcr,
    winform.lnkTranslate,
    winform.btnOpen,
    winform.btnScreenClip
] {
    ctrl.skin(btnSkin);
}

winform.lnkOptimize.skin({
    color = {
        default = 0xFF3498DB;
        hover = 0xFF2980B9;
        active = 0xFF1F618D;
         disabled=0xFFAAAAAA;
    }
})

winform.lnkTranslate.skin({
    color = {
        default = 0xFF3498DB;
        hover = 0xFF2980B9;
        active = 0xFF1F618D;
         disabled=0xFFAAAAAA;
    }
})

/*
支持的全部语言
Arabic=ara
Bulgarian=bul
Chinese(Simplified)=chs
Chinese(Traditional)=cht
Croatian = hrv
Czech = cze
Danish = dan
Dutch = dut
English = eng
Finnish = fin
French = fre
German = ger
Greek = gre
Hungarian = hun
Korean = kor
Italian = ita
Japanese = jpn
Polish = pol
Portuguese = por
Russian = rus
Slovenian = slv
Spanish = spa
Swedish = swe
Thai = tha
Turkish = tur
Ukrainian = ukr
Vietnamese = vnm

全部添加到下拉框,格式例如
winform.comboLanguage.items = ["自动检测","简体中文 chs","繁体中文 cht","英文 enu"]

所有语言有空格分开标题与 ID,以便在程序中自动提取后面的语言 ID
*/
winform.comboLanguage.items = {
    "自动检测 auto";
    "简体中文 chs";
    "繁体中文 cht";
    "阿拉伯语 ara";
    "保加利亚语 bul";
    "克罗地亚语 hrv";
    "捷克语 cze";
    "丹麦语 dan";
    "荷兰语 dut";
    "英语 eng";
    "芬兰语 fin";
    "法语 fre";
    "德语 ger";
    "希腊语 gre";
    "匈牙利语 hun";
    "韩语 kor";
    "意大利语 ita";
    "日语 jpn";
    "波兰语 pol";
    "葡萄牙语 por";
    "俄语 rus";
    "斯洛文尼亚语 slv";
    "西班牙语 spa";
    "瑞典语 swe";
    "泰语 tha";
    "土耳其语 tur";
    "乌克兰语 ukr";
    "越南语 vnm"
}

winform.lnkOptimize.oncommand = function(id,event){
    var text = string.trim(winform.edit.text);
    if(!#text){
        return winform.msgboxErr("识别结果为空")
    }

    winform.btnOcr.disabled = true;
    winform.lnkTranslate.disabled = true; 
    winform.lnkOptimize.disabledText = ['\uF254','\uF251','\uF252','\uF253','\uF250']

    thread.invoke( 
        function(winform,text){

            import web.rest.aiChat;
            var aiClient = web.rest.aiChat(
                key =   '\0\1\96';
                url = "https://ai.aardio.com/api/v1/";//接口地址
                model = "prompt";
                temperature = 0.5;//温度
                maxTokens = 1024 //最大回复长度
            )

            //2. 第二步:创建消息队列,必须在这里保存对话,不然 AI 的回复没有上下文。
            //---------------------------------------------------------------------
            var msg = web.rest.aiChat.message();

            //可调用 msg.system() 函数添加系统提示词。
            msg.system(`# 角色
你是一位 OCR 图文识别结果修复工程师。

# 任务

用户输入的文本是使用 OCR 图文识别工具的识别结果。
你的任务是在尊重图文原意的基础上对识别结果进行评估与修复,纠正识别错误。

你应当根据文本相关的文化与背景知识对识别结果的格式进行整理。
如果识别结果中出现与前后文本完全不相关的多余字符应当去除(较大可能可以判定为 OCR 工具将非字符图形误判为文字)。

输出格式为纯文本,不使用 Markdown 标记(除非识别结果本身包含 Markdown 标记)。

# 要求  
无需解释你的思考过程,直接输入回复。
`)


            //添加用户提示词
            msg.prompt( "请修复 OCR 识别结果: " + text );

            winform.edit.text = "";

            var resp,err = aiClient.messages(msg,
                function(deltaText,reasoning){
                     if(deltaText) winform.edit.appendText(deltaText); 

                }
            );

            winform.btnOcr.disabled = false;
            winform.lnkTranslate.disabled = false; 
            winform.lnkOptimize.disabledText = null;
        },winform,text
    )   
}

winform.comboLanguage.selIndex = 1;

winform.show()
win.loopMessage();
Markdown 格式