{"id":44653,"date":"2025-06-20T07:32:03","date_gmt":"2025-06-19T23:32:03","guid":{"rendered":"https:\/\/www.wsisp.com\/helps\/44653.html"},"modified":"2025-06-20T07:32:03","modified_gmt":"2025-06-19T23:32:03","slug":"%e7%99%be%e5%ba%a6ocr%e7%9a%84%e7%ae%80%e5%8d%95%e5%b0%81%e8%a3%85","status":"publish","type":"post","link":"https:\/\/www.wsisp.com\/helps\/44653.html","title":{"rendered":"\u767e\u5ea6ocr\u7684\u7b80\u5355\u5c01\u88c5"},"content":{"rendered":"<p>\u767e\u5ea6ocr\u5730\u5740<\/p>\n<p>\u4ee5\u4e0b\u4ee3\u7801\u4e3a\u5bf9\u767e\u5ea6ocr\u7684\u7b80\u5355\u5c01\u88c5,\u5b9e\u9645\u4f7f\u7528\u65f6\u63a8\u8350\u4f7f\u7528baidu-aip<\/p>\n<p>\u767e\u5ea6\u901a\u7528ocr<\/p>\n<p><span class=\"token keyword\">import<\/span> base64<br \/>\n<span class=\"token keyword\">from<\/span> enum <span class=\"token keyword\">import<\/span> Enum<span class=\"token punctuation\">,<\/span> unique<br \/>\n<span class=\"token keyword\">import<\/span> requests<br \/>\n<span class=\"token keyword\">import<\/span> logging <span class=\"token keyword\">as<\/span> log<\/p>\n<p><span class=\"token decorator annotation punctuation\">&#064;unique<\/span><br \/>\n<span class=\"token keyword\">class<\/span> <span class=\"token class-name\">OcrType<\/span><span class=\"token punctuation\">(<\/span>Enum<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n    <span class=\"token comment\"># \u6807\u51c6\u7248<\/span><br \/>\n    STANDARD_BASIC <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/general_basic&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u6807\u51c6\u7248\u542b\u4f4d\u7f6e<\/span><br \/>\n    STANDARD_WITH_LOCATION <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/general&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u9ad8\u7cbe\u5ea6\u7248<\/span><br \/>\n    ACCURATE_BASIC <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/accurate_basic&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u9ad8\u7cbe\u5ea6\u7248\u542b\u4f4d\u7f6e<\/span><br \/>\n    ACCURATE_WITH_LOCATION <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/accurate&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u529e\u516c\u6587\u6863\u8bc6\u522b<\/span><br \/>\n    DOC_ANALYSiS_OFFICE <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/doc_analysis_office&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u7f51\u7edc\u56fe\u7247\u6587\u5b57\u8bc6\u522b<\/span><br \/>\n    WEB_IMAGE <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/webimage&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u7f51\u7edc\u56fe\u7247\u6587\u5b57\u8bc6\u522b \u542b\u4f4d\u7f6e<\/span><br \/>\n    WEB_IMAGE_WITH_LOCATION <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/webimage_loc&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u624b\u5199\u6587\u5b57\u8bc6\u522b<\/span><br \/>\n    HAND_WRITING <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/handwriting&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u6570\u5b57\u8bc6\u522b<\/span><br \/>\n    NUMBERS <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/numbers&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u8868\u683c\u6587\u5b57\u8bc6\u522b(\u540c\u6b65\u63a5\u53e3)<\/span><br \/>\n    FORM_SYNCH <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/form&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u8868\u683c\u6587\u5b57\u8bc6\u522b(\u5f02\u6b65\u63a5\u53e3)<\/span><br \/>\n    FORM_ASYNCH <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/solution\/v1\/form_ocr\/request&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u4e8c\u7ef4\u7801\u8bc6\u522b<\/span><br \/>\n    QRCORD <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/qrcode&#034;<\/span><\/p>\n<p><span class=\"token keyword\">def<\/span> <span class=\"token function\">ocr_help<\/span><span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n    <span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;&#061;&#061;&#061;&#061;&#061;&#061;&#061;&#061;&#061;&#061;\u767e\u5ea6ocr\u4f7f\u7528\u8bf4\u660e&#061;&#061;&#061;&#061;&#061;&#061;&#061;&#061;&#061;&#061;&#034;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n    <span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;\u672cAPI\u57fa\u4e8eocr\u901a\u7528\u8bc6\u522bapi\u7f16\u5199,\u5b98\u65b9\u6587\u6863\u5730\u5740:https:\/\/cloud.baidu.com\/doc\/OCR\/s\/zk3h7xz52&#034;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n    <span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;\u4f7f\u7528\u793a\u4f8b:&#034;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n    <span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span><span class=\"token triple-quoted-string string\">&#039;&#039;&#039;<br \/>\n    baiduOcr &#061; BaiduGeneralOcr(OcrType.STANDARD_BASIC)<br \/>\n    baiduOcr.set_access_token(&#034;access_token&#034;)<br \/>\n    wordsList &#061; baiduOcr.recoginze(image&#061;&#034;D:\\\\\\\\txt1.png&#034;,options&#061;{})[&#039;words_result&#039;]<br \/>\n    for word in wordsList:<br \/>\n        print(word)<br \/>\n    &#039;&#039;&#039;<\/span><span class=\"token punctuation\">)<\/span><\/p>\n<p><span class=\"token keyword\">class<\/span> <span class=\"token class-name\">BaiduGeneralOcr<\/span><span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n    <span class=\"token comment\"># ocr\u7248\u672c<\/span><br \/>\n    ocr_type <span class=\"token operator\">&#061;<\/span> <span class=\"token number\">0<\/span><\/p>\n<p>    <span class=\"token keyword\">def<\/span> <span class=\"token function\">__init__<\/span><span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">,<\/span> ocr_type<span class=\"token punctuation\">:<\/span> OcrType<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n        <span class=\"token triple-quoted-string string\">&#034;&#034;&#034;<br \/>\n        ocr_type ocr\u8bc6\u522b\u7c7b\u578b STANDARD_BASIC\u6807\u51c6\u7248 \u6807\u51c6\u7248\u542b\u4f4d\u7f6eSTANDARD_WITH_LOCATION \u9ad8\u7cbe\u8bfb\u7248ACCURATE_BASIC \u9ad8\u7cbe\u5ea6\u7248\u542b\u4f4d\u7f6eACCURATE_WITH_LOCATION<br \/>\n        &#064;param ocr_type:<br \/>\n        &#034;&#034;&#034;<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>options <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>pdf_file <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>url <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>image <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>access_token <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>ocr_type <span class=\"token operator\">&#061;<\/span> ocr_type<span class=\"token punctuation\">.<\/span>value<\/p>\n<p>    <span class=\"token keyword\">def<\/span> <span class=\"token function\">gen_access_token<\/span><span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">,<\/span> api_key<span class=\"token punctuation\">,<\/span> secret_key<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n        <span class=\"token triple-quoted-string string\">&#034;&#034;&#034;<br \/>\n        \u751f\u6210access_token<br \/>\n        &#064;param api_key:<br \/>\n        &#064;param secret_key:<br \/>\n        &#064;return:<br \/>\n        &#034;&#034;&#034;<\/span><br \/>\n        request_url <span class=\"token operator\">&#061;<\/span> <span class=\"token string-interpolation\"><span class=\"token string\">f&#039;&#039;&#039;https:\/\/aip.baidubce.com\/oauth\/2.0\/token?grant_type&#061;client_credentials&amp;client_id&#061;<\/span><span class=\"token interpolation\"><span class=\"token punctuation\">{<\/span>api_key<span class=\"token punctuation\">}<\/span><\/span><span class=\"token string\">&amp;client_secret&#061;<\/span><span class=\"token interpolation\"><span class=\"token punctuation\">{<\/span>secret_key<span class=\"token punctuation\">}<\/span><\/span><span class=\"token string\">&#039;&#039;&#039;<\/span><\/span><br \/>\n        response <span class=\"token operator\">&#061;<\/span> requests<span class=\"token punctuation\">.<\/span>get<span class=\"token punctuation\">(<\/span>request_url<span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token keyword\">if<\/span> response<span class=\"token punctuation\">:<\/span><br \/>\n            <span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;access_token:%s&#034;<\/span> <span class=\"token operator\">%<\/span><span class=\"token punctuation\">(<\/span>response<span class=\"token punctuation\">.<\/span>json<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">[<\/span><span class=\"token string\">&#039;access_token&#039;<\/span><span class=\"token punctuation\">]<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">)<\/span><br \/>\n            self<span class=\"token punctuation\">.<\/span>access_token <span class=\"token operator\">&#061;<\/span> response<span class=\"token punctuation\">.<\/span>json<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">[<\/span><span class=\"token string\">&#039;access_token&#039;<\/span><span class=\"token punctuation\">]<\/span><\/p>\n<p>    <span class=\"token keyword\">def<\/span> <span class=\"token function\">__check<\/span><span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n        <span class=\"token triple-quoted-string string\">&#034;&#034;&#034;<br \/>\n        \u53c2\u6570\u68c0\u67e5<br \/>\n        &#064;return:<br \/>\n        &#034;&#034;&#034;<\/span><br \/>\n        image <span class=\"token operator\">&#061;<\/span> self<span class=\"token punctuation\">.<\/span>image<br \/>\n        url <span class=\"token operator\">&#061;<\/span> self<span class=\"token punctuation\">.<\/span>url<br \/>\n        pdf_file <span class=\"token operator\">&#061;<\/span> self<span class=\"token punctuation\">.<\/span>pdf_file<\/p>\n<p>        <span class=\"token keyword\">if<\/span> <span class=\"token punctuation\">(<\/span>image <span class=\"token keyword\">is<\/span> <span class=\"token boolean\">None<\/span> <span class=\"token keyword\">or<\/span> image <span class=\"token operator\">&#061;&#061;<\/span> <span class=\"token string\">&#034;&#034;<\/span><span class=\"token punctuation\">)<\/span> <span class=\"token keyword\">and<\/span> <span class=\"token punctuation\">(<\/span>url <span class=\"token keyword\">is<\/span> <span class=\"token boolean\">None<\/span> <span class=\"token keyword\">or<\/span> url <span class=\"token operator\">&#061;&#061;<\/span> <span class=\"token string\">&#034;&#034;<\/span><span class=\"token punctuation\">)<\/span> <span class=\"token keyword\">and<\/span> <span class=\"token punctuation\">(<\/span>pdf_file <span class=\"token keyword\">is<\/span> <span class=\"token boolean\">None<\/span> <span class=\"token keyword\">or<\/span> pdf_file <span class=\"token operator\">&#061;&#061;<\/span> <span class=\"token string\">&#034;&#034;<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n            <span class=\"token keyword\">raise<\/span> ValueError<span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;image,url,pdf_file\u81f3\u5c11\u4f20\u5165\u4e00\u9879&#034;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token keyword\">if<\/span> <span class=\"token punctuation\">(<\/span>image <span class=\"token keyword\">is<\/span> <span class=\"token keyword\">not<\/span> <span class=\"token boolean\">None<\/span><span class=\"token punctuation\">)<\/span> <span class=\"token keyword\">and<\/span> <span class=\"token punctuation\">(<\/span>image <span class=\"token operator\">!&#061;<\/span> <span class=\"token string\">&#034;&#034;<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n            f <span class=\"token operator\">&#061;<\/span> <span class=\"token builtin\">open<\/span><span class=\"token punctuation\">(<\/span>image<span class=\"token punctuation\">,<\/span> <span class=\"token string\">&#039;rb&#039;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n            self<span class=\"token punctuation\">.<\/span>options<span class=\"token punctuation\">[<\/span><span class=\"token string\">&#039;image&#039;<\/span><span class=\"token punctuation\">]<\/span> <span class=\"token operator\">&#061;<\/span> base64<span class=\"token punctuation\">.<\/span>b64encode<span class=\"token punctuation\">(<\/span>f<span class=\"token punctuation\">.<\/span>read<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">.<\/span>decode<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token keyword\">elif<\/span> <span class=\"token punctuation\">(<\/span>image <span class=\"token keyword\">is<\/span> <span class=\"token keyword\">not<\/span> <span class=\"token boolean\">None<\/span> <span class=\"token keyword\">or<\/span> image <span class=\"token operator\">&#061;&#061;<\/span> <span class=\"token string\">&#034;&#034;<\/span><span class=\"token punctuation\">)<\/span> <span class=\"token keyword\">and<\/span> <span class=\"token punctuation\">(<\/span>url <span class=\"token keyword\">is<\/span> <span class=\"token keyword\">not<\/span> <span class=\"token boolean\">None<\/span> <span class=\"token keyword\">and<\/span> url <span class=\"token operator\">!&#061;<\/span> <span class=\"token string\">&#034;&#034;<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n            self<span class=\"token punctuation\">.<\/span>options<span class=\"token punctuation\">[<\/span><span class=\"token string\">&#039;url&#039;<\/span><span class=\"token punctuation\">]<\/span> <span class=\"token operator\">&#061;<\/span> url<br \/>\n        <span class=\"token keyword\">else<\/span><span class=\"token punctuation\">:<\/span><br \/>\n            f <span class=\"token operator\">&#061;<\/span> <span class=\"token builtin\">open<\/span><span class=\"token punctuation\">(<\/span>pdf_file<span class=\"token punctuation\">,<\/span> <span class=\"token string\">&#039;rb&#039;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n            self<span class=\"token punctuation\">.<\/span>options<span class=\"token punctuation\">[<\/span><span class=\"token string\">&#039;pdf_file&#039;<\/span><span class=\"token punctuation\">]<\/span> <span class=\"token operator\">&#061;<\/span> base64<span class=\"token punctuation\">.<\/span>b64encode<span class=\"token punctuation\">(<\/span>f<span class=\"token punctuation\">.<\/span>read<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">.<\/span>decode<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><\/p>\n<p>        keys <span class=\"token operator\">&#061;<\/span> self<span class=\"token punctuation\">.<\/span>options<span class=\"token punctuation\">.<\/span>keys<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token keyword\">if<\/span> <span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;image&#034;<\/span> <span class=\"token keyword\">not<\/span> <span class=\"token keyword\">in<\/span> keys<span class=\"token punctuation\">)<\/span> <span class=\"token keyword\">and<\/span> <span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;url&#034;<\/span> <span class=\"token keyword\">not<\/span> <span class=\"token keyword\">in<\/span> keys<span class=\"token punctuation\">)<\/span> <span class=\"token keyword\">and<\/span> <span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;pdf_file&#034;<\/span> <span class=\"token keyword\">not<\/span> <span class=\"token keyword\">in<\/span> keys<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n            <span class=\"token keyword\">raise<\/span> ValueError<span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;image,url,pdf_file\u81f3\u5c11\u4f20\u5165\u4e00\u9879&#034;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token keyword\">try<\/span><span class=\"token punctuation\">:<\/span><br \/>\n            self<span class=\"token punctuation\">.<\/span>ocr_type<span class=\"token punctuation\">.<\/span>value<br \/>\n        <span class=\"token keyword\">except<\/span> Exception <span class=\"token keyword\">as<\/span> e<span class=\"token punctuation\">:<\/span><br \/>\n            log<span class=\"token punctuation\">.<\/span>info<span class=\"token punctuation\">(<\/span><span class=\"token builtin\">repr<\/span><span class=\"token punctuation\">(<\/span>e<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">)<\/span><br \/>\n            self<span class=\"token punctuation\">.<\/span>ocr_type <span class=\"token operator\">&#061;<\/span> OcrType<span class=\"token punctuation\">.<\/span>STANDARD_BASIC<br \/>\n            log<span class=\"token punctuation\">.<\/span>info<span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;ocr_type\u7c7b\u578b,\u5df2\u91cd\u7f6e\u4e3a\u6807\u51c6\u7248&#034;<\/span><span class=\"token punctuation\">)<\/span><\/p>\n<p>    <span class=\"token keyword\">def<\/span> <span class=\"token function\">__request<\/span><span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">,<\/span> request_url<span class=\"token punctuation\">,<\/span> data<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n        <span class=\"token comment\"># \u8bbe\u7f6eheader<\/span><br \/>\n        headers <span class=\"token operator\">&#061;<\/span> <span class=\"token punctuation\">{<\/span><span class=\"token string\">&#039;content-type&#039;<\/span><span class=\"token punctuation\">:<\/span> <span class=\"token string\">&#039;application\/x-www-form-urlencoded&#039;<\/span><span class=\"token punctuation\">}<\/span><br \/>\n        <span class=\"token comment\"># \u8bf7\u6c42<\/span><br \/>\n        <span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">.<\/span>options<span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span>headers<span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token keyword\">return<\/span> requests<span class=\"token punctuation\">.<\/span>post<span class=\"token punctuation\">(<\/span>request_url <span class=\"token operator\">&#043;<\/span> <span class=\"token string\">&#034;?access_token&#061;%s&#034;<\/span> <span class=\"token operator\">%<\/span> self<span class=\"token punctuation\">.<\/span>access_token<span class=\"token punctuation\">,<\/span> data<span class=\"token operator\">&#061;<\/span>self<span class=\"token punctuation\">.<\/span>options<span class=\"token punctuation\">,<\/span><br \/>\n                             headers<span class=\"token operator\">&#061;<\/span>headers<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">.<\/span>json<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><\/p>\n<p>    <span class=\"token keyword\">def<\/span> <span class=\"token function\">recoginze<\/span><span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">,<\/span> image<span class=\"token punctuation\">:<\/span> <span class=\"token builtin\">str<\/span> <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><span class=\"token punctuation\">,<\/span> url<span class=\"token punctuation\">:<\/span> <span class=\"token builtin\">str<\/span> <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><span class=\"token punctuation\">,<\/span> pdf_file<span class=\"token punctuation\">:<\/span> <span class=\"token builtin\">str<\/span> <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><span class=\"token punctuation\">,<\/span> options<span class=\"token operator\">&#061;<\/span><span class=\"token boolean\">None<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n        <span class=\"token triple-quoted-string string\">&#034;&#034;&#034;<br \/>\n        \u8bc6\u522b<br \/>\n        &#064;param image:<br \/>\n        &#064;param url:<br \/>\n        &#064;param pdf_file:<br \/>\n        &#064;param options:<br \/>\n        &#064;return:<br \/>\n        &#034;&#034;&#034;<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>image <span class=\"token operator\">&#061;<\/span> image<br \/>\n        self<span class=\"token punctuation\">.<\/span>url <span class=\"token operator\">&#061;<\/span> url<br \/>\n        self<span class=\"token punctuation\">.<\/span>pdf_file <span class=\"token operator\">&#061;<\/span> pdf_file<br \/>\n        self<span class=\"token punctuation\">.<\/span>options <span class=\"token operator\">&#061;<\/span> options <span class=\"token keyword\">or<\/span> <span class=\"token punctuation\">{<\/span><span class=\"token punctuation\">}<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>__check<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token comment\"># \u53d1\u9001\u8bf7\u6c42<\/span><br \/>\n        <span class=\"token keyword\">return<\/span> self<span class=\"token punctuation\">.<\/span>__request<span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">.<\/span>ocr_type<span class=\"token punctuation\">.<\/span>value<span class=\"token punctuation\">,<\/span> options<span class=\"token punctuation\">)<\/span><\/p>\n<p>    <span class=\"token keyword\">def<\/span> <span class=\"token function\">set_access_token<\/span><span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">,<\/span> access_token<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n        <span class=\"token triple-quoted-string string\">&#034;&#034;&#034;<br \/>\n        \u8bbe\u7f6eaccess_token<br \/>\n        &#064;param access_token:<br \/>\n        &#064;return:<br \/>\n        &#034;&#034;&#034;<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>access_token <span class=\"token operator\">&#061;<\/span> access_token<\/p>\n<p>\u767e\u5ea6\u5361\u7247\u8bc6\u522bocr<\/p>\n<p><span class=\"token keyword\">import<\/span> requests<br \/>\n<span class=\"token keyword\">import<\/span> base64<br \/>\n<span class=\"token keyword\">import<\/span> json<br \/>\n<span class=\"token keyword\">from<\/span> cwrpa<span class=\"token punctuation\">.<\/span>log<span class=\"token punctuation\">.<\/span>log <span class=\"token keyword\">import<\/span> logging <span class=\"token keyword\">as<\/span> log<br \/>\n<span class=\"token keyword\">from<\/span> enum <span class=\"token keyword\">import<\/span> Enum<span class=\"token punctuation\">,<\/span> unique<br \/>\n<span class=\"token keyword\">import<\/span> keyring<\/p>\n<p><span class=\"token decorator annotation punctuation\">&#064;unique<\/span><br \/>\n<span class=\"token keyword\">class<\/span> <span class=\"token class-name\">OcrType<\/span><span class=\"token punctuation\">(<\/span>Enum<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n    <span class=\"token comment\"># \u8eab\u4efd\u8bc1\u8bc6\u522b<\/span><br \/>\n    ID_CARD <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/idcard&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u8eab\u4efd\u8bc1\u6df7\u8d34\u8bc6\u522b<\/span><br \/>\n    MULTI_IDCARD <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/multi_idcard&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u8eab\u4efd\u8bc1\u8bc6\u522b(\u91d1\u878d\u52a0\u5bc6\u7248)<\/span><br \/>\n    IDCARD_ENC <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/idcard_enc&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u94f6\u884c\u5361\u8bc6\u522b<\/span><br \/>\n    BANKCARD <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/bankcard&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u8425\u4e1a\u6267\u7167\u8bc6\u522b<\/span><br \/>\n    BUSINESS_LICENSE <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/business_license&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u540d\u7247\u8bc6\u522b<\/span><br \/>\n    BUSINESS_CARD <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/business_card&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u62a4\u7167\u8bc6\u522b<\/span><br \/>\n    PASSPORT <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/passport&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u793e\u4fdd\u5361\u8bc6\u522b<\/span><br \/>\n    SOCIAL_SECURITY_CARD <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/social_security_card&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u6e2f\u6fb3\u901a\u884c\u8bc1\u8bc6\u522b<\/span><br \/>\n    HK_MACAU_EXITENTRYPERMIT <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/HK_Macau_exitentrypermit&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u53f0\u6e7e\u901a\u884c\u8bc1\u8bc6\u522b<\/span><br \/>\n    TAIWAN_EXITENTRYPERMIT <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034; https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/taiwan_exitentrypermit&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u6237\u53e3\u672c\u8bc6\u522b<\/span><br \/>\n    HOUSEHOLD_REGISTER <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/household_register&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u51fa\u751f\u533b\u5b66\u8bc6\u522b\u8bc1\u660e<\/span><br \/>\n    BITTH_CERTIFICATE <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/birth_certificate&#034;<\/span><br \/>\n    <span class=\"token comment\"># \u591a\u5361\u8bc1\u7c7b\u522b\u68c0\u6d4b<\/span><br \/>\n    MULTI_CARD_CLASSIFY <span class=\"token operator\">&#061;<\/span> <span class=\"token string\">&#034;https:\/\/aip.baidubce.com\/rest\/2.0\/ocr\/v1\/multi_card_classify&#034;<\/span><\/p>\n<p><span class=\"token keyword\">def<\/span> <span class=\"token function\">ocr_help<\/span><span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n    <span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;&#061;&#061;&#061;&#061;&#061;&#061;&#061;&#061;&#061;&#061;\u767e\u5ea6ocr\u4f7f\u7528\u8bf4\u660e&#061;&#061;&#061;&#061;&#061;&#061;&#061;&#061;&#061;&#061;&#034;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n    <span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;\u672cAPI\u57fa\u4e8eocr\u5361\u8bc1\u8bc6\u522bapi\u7f16\u5199,\u5b98\u65b9\u6587\u6863\u5730\u5740:https:\/\/ai.baidu.com\/ai-doc\/OCR\/rk3h7xzck&#034;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n    <span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;\u4f7f\u7528\u793a\u4f8b:&#034;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n    <span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span><span class=\"token triple-quoted-string string\">&#039;&#039;&#039;<br \/>\n    baiduOcr &#061; BaiduCardOcr(OcrType.ID_CARD)<br \/>\n    baiduOcr.set_access_token(&#034;access_token&#034;)<br \/>\n    wordsList &#061; baiduOcr.recoginze(image&#061;&#034;D:\\\\\\\\txt1.png&#034;,options&#061;{})[&#039;words_result&#039;]<br \/>\n    for word in wordsList:<br \/>\n        print(word)<br \/>\n    &#039;&#039;&#039;<\/span><span class=\"token punctuation\">)<\/span><\/p>\n<p><span class=\"token keyword\">class<\/span> <span class=\"token class-name\">BaiduCardOcr<\/span><span class=\"token punctuation\">:<\/span><br \/>\n    <span class=\"token comment\"># ocr\u7248\u672c<\/span><br \/>\n    ocr_type <span class=\"token operator\">&#061;<\/span> <span class=\"token number\">0<\/span><\/p>\n<p>    <span class=\"token keyword\">def<\/span> <span class=\"token function\">__init__<\/span><span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">,<\/span> ocr_type<span class=\"token punctuation\">:<\/span> OcrType<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n        <span class=\"token triple-quoted-string string\">&#034;&#034;&#034;<br \/>\n        ocr_type ocr\u8bc6\u522b\u7c7b\u578b STANDARD_BASIC\u6807\u51c6\u7248 \u6807\u51c6\u7248\u542b\u4f4d\u7f6eSTANDARD_WITH_LOCATION \u9ad8\u7cbe\u8bfb\u7248ACCURATE_BASIC \u9ad8\u7cbe\u5ea6\u7248\u542b\u4f4d\u7f6eACCURATE_WITH_LOCATION<br \/>\n        &#064;param ocr_type:<br \/>\n        &#034;&#034;&#034;<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>options <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>pdf_file <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>url <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>image <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>access_token <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>ocr_type <span class=\"token operator\">&#061;<\/span> ocr_type<span class=\"token punctuation\">.<\/span>value<\/p>\n<p>    <span class=\"token keyword\">def<\/span> <span class=\"token function\">gen_access_token<\/span><span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">,<\/span> api_key<span class=\"token punctuation\">,<\/span> secret_key<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n        <span class=\"token triple-quoted-string string\">&#034;&#034;&#034;<br \/>\n        \u751f\u6210access_token<br \/>\n        &#064;param api_key:<br \/>\n        &#064;param secret_key:<br \/>\n        &#064;return:<br \/>\n        &#034;&#034;&#034;<\/span><br \/>\n        request_url <span class=\"token operator\">&#061;<\/span> <span class=\"token string-interpolation\"><span class=\"token string\">f&#039;&#039;&#039;https:\/\/aip.baidubce.com\/oauth\/2.0\/token?grant_type&#061;client_credentials&amp;client_id&#061;<\/span><span class=\"token interpolation\"><span class=\"token punctuation\">{<\/span>api_key<span class=\"token punctuation\">}<\/span><\/span><span class=\"token string\">&amp;client_secret&#061;<\/span><span class=\"token interpolation\"><span class=\"token punctuation\">{<\/span>secret_key<span class=\"token punctuation\">}<\/span><\/span><span class=\"token string\">&#039;&#039;&#039;<\/span><\/span><br \/>\n        response <span class=\"token operator\">&#061;<\/span> requests<span class=\"token punctuation\">.<\/span>get<span class=\"token punctuation\">(<\/span>request_url<span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token keyword\">if<\/span> response<span class=\"token punctuation\">:<\/span><br \/>\n            self<span class=\"token punctuation\">.<\/span>access_token <span class=\"token operator\">&#061;<\/span> response<span class=\"token punctuation\">.<\/span>json<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">[<\/span><span class=\"token string\">&#039;access_token&#039;<\/span><span class=\"token punctuation\">]<\/span><\/p>\n<p>    <span class=\"token keyword\">def<\/span> <span class=\"token function\">__check<\/span><span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n        <span class=\"token triple-quoted-string string\">&#034;&#034;&#034;<br \/>\n        \u53c2\u6570\u68c0\u67e5<br \/>\n        &#064;return:<br \/>\n        &#034;&#034;&#034;<\/span><br \/>\n        image <span class=\"token operator\">&#061;<\/span> self<span class=\"token punctuation\">.<\/span>image<br \/>\n        url <span class=\"token operator\">&#061;<\/span> self<span class=\"token punctuation\">.<\/span>url<br \/>\n        pdf_file <span class=\"token operator\">&#061;<\/span> self<span class=\"token punctuation\">.<\/span>pdf_file<\/p>\n<p>        <span class=\"token keyword\">if<\/span> <span class=\"token punctuation\">(<\/span>image <span class=\"token keyword\">is<\/span> <span class=\"token boolean\">None<\/span> <span class=\"token keyword\">or<\/span> image <span class=\"token operator\">&#061;&#061;<\/span> <span class=\"token string\">&#034;&#034;<\/span><span class=\"token punctuation\">)<\/span> <span class=\"token keyword\">and<\/span> <span class=\"token punctuation\">(<\/span>url <span class=\"token keyword\">is<\/span> <span class=\"token boolean\">None<\/span> <span class=\"token keyword\">or<\/span> url <span class=\"token operator\">&#061;&#061;<\/span> <span class=\"token string\">&#034;&#034;<\/span><span class=\"token punctuation\">)<\/span> <span class=\"token keyword\">and<\/span> <span class=\"token punctuation\">(<\/span>pdf_file <span class=\"token keyword\">is<\/span> <span class=\"token boolean\">None<\/span> <span class=\"token keyword\">or<\/span> pdf_file <span class=\"token operator\">&#061;&#061;<\/span> <span class=\"token string\">&#034;&#034;<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n            <span class=\"token keyword\">raise<\/span> ValueError<span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;image,url,pdf_file\u81f3\u5c11\u4f20\u5165\u4e00\u9879&#034;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token keyword\">if<\/span> <span class=\"token punctuation\">(<\/span>image <span class=\"token keyword\">is<\/span> <span class=\"token keyword\">not<\/span> <span class=\"token boolean\">None<\/span><span class=\"token punctuation\">)<\/span> <span class=\"token keyword\">and<\/span> <span class=\"token punctuation\">(<\/span>image <span class=\"token operator\">!&#061;<\/span> <span class=\"token string\">&#034;&#034;<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n            f <span class=\"token operator\">&#061;<\/span> <span class=\"token builtin\">open<\/span><span class=\"token punctuation\">(<\/span>image<span class=\"token punctuation\">,<\/span> <span class=\"token string\">&#039;rb&#039;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n            self<span class=\"token punctuation\">.<\/span>options<span class=\"token punctuation\">[<\/span><span class=\"token string\">&#039;image&#039;<\/span><span class=\"token punctuation\">]<\/span> <span class=\"token operator\">&#061;<\/span> base64<span class=\"token punctuation\">.<\/span>b64encode<span class=\"token punctuation\">(<\/span>f<span class=\"token punctuation\">.<\/span>read<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">.<\/span>decode<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token keyword\">elif<\/span> <span class=\"token punctuation\">(<\/span>image <span class=\"token keyword\">is<\/span> <span class=\"token keyword\">not<\/span> <span class=\"token boolean\">None<\/span> <span class=\"token keyword\">or<\/span> image <span class=\"token operator\">&#061;&#061;<\/span> <span class=\"token string\">&#034;&#034;<\/span><span class=\"token punctuation\">)<\/span> <span class=\"token keyword\">and<\/span> <span class=\"token punctuation\">(<\/span>url <span class=\"token keyword\">is<\/span> <span class=\"token keyword\">not<\/span> <span class=\"token boolean\">None<\/span> <span class=\"token keyword\">and<\/span> url <span class=\"token operator\">!&#061;<\/span> <span class=\"token string\">&#034;&#034;<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n            self<span class=\"token punctuation\">.<\/span>options<span class=\"token punctuation\">[<\/span><span class=\"token string\">&#039;url&#039;<\/span><span class=\"token punctuation\">]<\/span> <span class=\"token operator\">&#061;<\/span> url<br \/>\n        <span class=\"token keyword\">else<\/span><span class=\"token punctuation\">:<\/span><br \/>\n            f <span class=\"token operator\">&#061;<\/span> <span class=\"token builtin\">open<\/span><span class=\"token punctuation\">(<\/span>pdf_file<span class=\"token punctuation\">,<\/span> <span class=\"token string\">&#039;rb&#039;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n            self<span class=\"token punctuation\">.<\/span>options<span class=\"token punctuation\">[<\/span><span class=\"token string\">&#039;pdf_file&#039;<\/span><span class=\"token punctuation\">]<\/span> <span class=\"token operator\">&#061;<\/span> base64<span class=\"token punctuation\">.<\/span>b64encode<span class=\"token punctuation\">(<\/span>f<span class=\"token punctuation\">.<\/span>read<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">.<\/span>decode<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><\/p>\n<p>        keys <span class=\"token operator\">&#061;<\/span> self<span class=\"token punctuation\">.<\/span>options<span class=\"token punctuation\">.<\/span>keys<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token keyword\">if<\/span> <span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;image&#034;<\/span> <span class=\"token keyword\">not<\/span> <span class=\"token keyword\">in<\/span> keys<span class=\"token punctuation\">)<\/span> <span class=\"token keyword\">and<\/span> <span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;url&#034;<\/span> <span class=\"token keyword\">not<\/span> <span class=\"token keyword\">in<\/span> keys<span class=\"token punctuation\">)<\/span> <span class=\"token keyword\">and<\/span> <span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;pdf_file&#034;<\/span> <span class=\"token keyword\">not<\/span> <span class=\"token keyword\">in<\/span> keys<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n            <span class=\"token keyword\">raise<\/span> ValueError<span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;image,url,pdf_file\u81f3\u5c11\u4f20\u5165\u4e00\u9879&#034;<\/span><span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token keyword\">try<\/span><span class=\"token punctuation\">:<\/span><br \/>\n            self<span class=\"token punctuation\">.<\/span>ocr_type<span class=\"token punctuation\">.<\/span>value<br \/>\n        <span class=\"token keyword\">except<\/span> Exception <span class=\"token keyword\">as<\/span> e<span class=\"token punctuation\">:<\/span><br \/>\n            log<span class=\"token punctuation\">.<\/span>info<span class=\"token punctuation\">(<\/span><span class=\"token builtin\">repr<\/span><span class=\"token punctuation\">(<\/span>e<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">)<\/span><br \/>\n            self<span class=\"token punctuation\">.<\/span>ocr_type <span class=\"token operator\">&#061;<\/span> OcrType<span class=\"token punctuation\">.<\/span>STANDARD_BASIC<br \/>\n            log<span class=\"token punctuation\">.<\/span>info<span class=\"token punctuation\">(<\/span><span class=\"token string\">&#034;ocr_type\u7c7b\u578b,\u5df2\u91cd\u7f6e\u4e3a\u6807\u51c6\u7248&#034;<\/span><span class=\"token punctuation\">)<\/span><\/p>\n<p>    <span class=\"token keyword\">def<\/span> <span class=\"token function\">__request<\/span><span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">,<\/span> request_url<span class=\"token punctuation\">,<\/span> data<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n        <span class=\"token comment\"># \u8bbe\u7f6eheader<\/span><br \/>\n        headers <span class=\"token operator\">&#061;<\/span> <span class=\"token punctuation\">{<\/span><span class=\"token string\">&#039;content-type&#039;<\/span><span class=\"token punctuation\">:<\/span> <span class=\"token string\">&#039;application\/x-www-form-urlencoded&#039;<\/span><span class=\"token punctuation\">}<\/span><br \/>\n        <span class=\"token comment\"># \u8bf7\u6c42<\/span><br \/>\n        <span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">.<\/span>options<span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token keyword\">print<\/span><span class=\"token punctuation\">(<\/span>headers<span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token keyword\">return<\/span> requests<span class=\"token punctuation\">.<\/span>post<span class=\"token punctuation\">(<\/span>request_url <span class=\"token operator\">&#043;<\/span> <span class=\"token string\">&#034;?access_token&#061;%s&#034;<\/span> <span class=\"token operator\">%<\/span> self<span class=\"token punctuation\">.<\/span>access_token<span class=\"token punctuation\">,<\/span> data<span class=\"token operator\">&#061;<\/span>self<span class=\"token punctuation\">.<\/span>options<span class=\"token punctuation\">,<\/span><br \/>\n                             headers<span class=\"token operator\">&#061;<\/span>headers<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">.<\/span>json<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><\/p>\n<p>    <span class=\"token keyword\">def<\/span> <span class=\"token function\">recoginze<\/span><span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">,<\/span> image<span class=\"token punctuation\">:<\/span> <span class=\"token builtin\">str<\/span> <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><span class=\"token punctuation\">,<\/span> url<span class=\"token punctuation\">:<\/span> <span class=\"token builtin\">str<\/span> <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><span class=\"token punctuation\">,<\/span> pdf_file<span class=\"token punctuation\">:<\/span> <span class=\"token builtin\">str<\/span> <span class=\"token operator\">&#061;<\/span> <span class=\"token boolean\">None<\/span><span class=\"token punctuation\">,<\/span> options<span class=\"token operator\">&#061;<\/span><span class=\"token boolean\">None<\/span><span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n        <span class=\"token triple-quoted-string string\">&#034;&#034;&#034;<br \/>\n        \u8bc6\u522b<br \/>\n        &#064;param image:<br \/>\n        &#064;param url:<br \/>\n        &#064;param pdf_file:<br \/>\n        &#064;param options:<br \/>\n        &#064;return:<br \/>\n        &#034;&#034;&#034;<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>image <span class=\"token operator\">&#061;<\/span> image<br \/>\n        self<span class=\"token punctuation\">.<\/span>url <span class=\"token operator\">&#061;<\/span> url<br \/>\n        self<span class=\"token punctuation\">.<\/span>pdf_file <span class=\"token operator\">&#061;<\/span> pdf_file<\/p>\n<p>        self<span class=\"token punctuation\">.<\/span>options <span class=\"token operator\">&#061;<\/span> options <span class=\"token keyword\">or<\/span> <span class=\"token punctuation\">{<\/span><span class=\"token punctuation\">}<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>__check<span class=\"token punctuation\">(<\/span><span class=\"token punctuation\">)<\/span><br \/>\n        <span class=\"token comment\"># \u53d1\u9001\u8bf7\u6c42<\/span><br \/>\n        <span class=\"token keyword\">return<\/span> self<span class=\"token punctuation\">.<\/span>__request<span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">.<\/span>ocr_type<span class=\"token punctuation\">.<\/span>value<span class=\"token punctuation\">,<\/span> options<span class=\"token punctuation\">)<\/span><\/p>\n<p>    <span class=\"token keyword\">def<\/span> <span class=\"token function\">set_access_token<\/span><span class=\"token punctuation\">(<\/span>self<span class=\"token punctuation\">,<\/span> access_token<span class=\"token punctuation\">)<\/span><span class=\"token punctuation\">:<\/span><br \/>\n        <span class=\"token triple-quoted-string string\">&#034;&#034;&#034;<br \/>\n        \u8bbe\u7f6eaccess_token<br \/>\n        &#064;param access_token:<br \/>\n        &#064;return:<br \/>\n        &#034;&#034;&#034;<\/span><br \/>\n        self<span class=\"token punctuation\">.<\/span>access_token <span class=\"token operator\">&#061;<\/span> access_token<\/p>\n","protected":false},"excerpt":{"rendered":"<p>\u6587\u7ae0\u6d4f\u89c8\u9605\u8bfb1.7k\u6b21\u3002\u672c\u6587\u4ecb\u7ecd\u4e86\u767e\u5ea6OCR API\u7684\u4e24\u79cdPython\u5c01\u88c5\u5b9e\u73b0\u3002\u7b2c\u4e00\u90e8\u5206\u5c01\u88c5\u4e86\u767e\u5ea6\u901a\u7528OCR\u529f\u80fd\uff0c\u63d0\u4f9b\u4e86\u591a\u79cd\u8bc6\u522b\u7c7b\u578b\u9009\u9879\uff08\u6807\u51c6\/\u9ad8\u7cbe\u5ea6\u7248\u3001\u542b\u4f4d\u7f6e\u4fe1\u606f\u7248\u3001\u529e\u516c\u6587\u6863\u3001\u7f51\u7edc\u56fe\u7247\u3001\u624b\u5199\u6587\u5b57\u7b49\uff09\uff0c\u652f\u6301\u56fe\u7247\/URL\/PDF\u6587\u4ef6\u8f93\u5165\uff0c\u5305\u542baccess_token\u751f\u6210\u3001\u53c2\u6570\u68c0\u67e5\u7b49\u8f85\u52a9\u529f\u80fd\u3002\u7b2c\u4e8c\u90e8\u5206\u7b80\u8981\u63d0\u53ca\u4e86\u767e\u5ea6\u5361\u7247\u8bc6\u522bOCR\u7684\u5b9e\u73b0\uff0c\u540c\u6837\u57fa\u4e8ePython\u5c01\u88c5\uff0c\u4f46\u4ee3\u7801\u672a\u5b8c\u6574\u5c55\u793a\u3002\u4e24\u79cd\u5c01\u88c5\u90fd\u91c7\u7528\u9762\u5411\u5bf9\u8c61\u8bbe\u8ba1\uff0c\u901a\u8fc7\u679a\u4e3e\u7c7b\u578b\u7ba1\u7406\u4e0d\u540cOCR\u63a5\u53e3\uff0c\u9002\u7528\u4e8e\u9700\u8981\u6587\u5b57\u8bc6\u522b\u7684\u81ea\u52a8\u5316\u573a\u666f\u3002_\u767e\u5ea6ocr<\/p>\n","protected":false},"author":2,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[1],"tags":[756,81,3691],"topic":[],"class_list":["post-44653","post","type-post","status-publish","format-standard","hentry","category-server","tag-ocr","tag-python","tag-3691"],"yoast_head":"<!-- This site is optimized with the Yoast SEO plugin v20.3 - https:\/\/yoast.com\/wordpress\/plugins\/seo\/ -->\n<title>\u767e\u5ea6ocr\u7684\u7b80\u5355\u5c01\u88c5 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/www.wsisp.com\/helps\/44653.html\" \/>\n<meta property=\"og:locale\" content=\"zh_CN\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"\u767e\u5ea6ocr\u7684\u7b80\u5355\u5c01\u88c5 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3\" \/>\n<meta property=\"og:description\" content=\"\u6587\u7ae0\u6d4f\u89c8\u9605\u8bfb1.7k\u6b21\u3002\u672c\u6587\u4ecb\u7ecd\u4e86\u767e\u5ea6OCR API\u7684\u4e24\u79cdPython\u5c01\u88c5\u5b9e\u73b0\u3002\u7b2c\u4e00\u90e8\u5206\u5c01\u88c5\u4e86\u767e\u5ea6\u901a\u7528OCR\u529f\u80fd\uff0c\u63d0\u4f9b\u4e86\u591a\u79cd\u8bc6\u522b\u7c7b\u578b\u9009\u9879\uff08\u6807\u51c6\/\u9ad8\u7cbe\u5ea6\u7248\u3001\u542b\u4f4d\u7f6e\u4fe1\u606f\u7248\u3001\u529e\u516c\u6587\u6863\u3001\u7f51\u7edc\u56fe\u7247\u3001\u624b\u5199\u6587\u5b57\u7b49\uff09\uff0c\u652f\u6301\u56fe\u7247\/URL\/PDF\u6587\u4ef6\u8f93\u5165\uff0c\u5305\u542baccess_token\u751f\u6210\u3001\u53c2\u6570\u68c0\u67e5\u7b49\u8f85\u52a9\u529f\u80fd\u3002\u7b2c\u4e8c\u90e8\u5206\u7b80\u8981\u63d0\u53ca\u4e86\u767e\u5ea6\u5361\u7247\u8bc6\u522bOCR\u7684\u5b9e\u73b0\uff0c\u540c\u6837\u57fa\u4e8ePython\u5c01\u88c5\uff0c\u4f46\u4ee3\u7801\u672a\u5b8c\u6574\u5c55\u793a\u3002\u4e24\u79cd\u5c01\u88c5\u90fd\u91c7\u7528\u9762\u5411\u5bf9\u8c61\u8bbe\u8ba1\uff0c\u901a\u8fc7\u679a\u4e3e\u7c7b\u578b\u7ba1\u7406\u4e0d\u540cOCR\u63a5\u53e3\uff0c\u9002\u7528\u4e8e\u9700\u8981\u6587\u5b57\u8bc6\u522b\u7684\u81ea\u52a8\u5316\u573a\u666f\u3002_\u767e\u5ea6ocr\" \/>\n<meta property=\"og:url\" content=\"https:\/\/www.wsisp.com\/helps\/44653.html\" \/>\n<meta property=\"og:site_name\" content=\"\u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3\" \/>\n<meta property=\"article:published_time\" content=\"2025-06-19T23:32:03+00:00\" \/>\n<meta name=\"author\" content=\"admin\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:label1\" content=\"\u4f5c\u8005\" \/>\n\t<meta name=\"twitter:data1\" content=\"admin\" \/>\n\t<meta name=\"twitter:label2\" content=\"\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4\" \/>\n\t<meta name=\"twitter:data2\" content=\"6 \u5206\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"WebPage\",\"@id\":\"https:\/\/www.wsisp.com\/helps\/44653.html\",\"url\":\"https:\/\/www.wsisp.com\/helps\/44653.html\",\"name\":\"\u767e\u5ea6ocr\u7684\u7b80\u5355\u5c01\u88c5 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3\",\"isPartOf\":{\"@id\":\"https:\/\/www.wsisp.com\/helps\/#website\"},\"datePublished\":\"2025-06-19T23:32:03+00:00\",\"dateModified\":\"2025-06-19T23:32:03+00:00\",\"author\":{\"@id\":\"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/358e386c577a3ab51c4493330a20ad41\"},\"breadcrumb\":{\"@id\":\"https:\/\/www.wsisp.com\/helps\/44653.html#breadcrumb\"},\"inLanguage\":\"zh-Hans\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"https:\/\/www.wsisp.com\/helps\/44653.html\"]}]},{\"@type\":\"BreadcrumbList\",\"@id\":\"https:\/\/www.wsisp.com\/helps\/44653.html#breadcrumb\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"\u9996\u9875\",\"item\":\"https:\/\/www.wsisp.com\/helps\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"\u767e\u5ea6ocr\u7684\u7b80\u5355\u5c01\u88c5\"}]},{\"@type\":\"WebSite\",\"@id\":\"https:\/\/www.wsisp.com\/helps\/#website\",\"url\":\"https:\/\/www.wsisp.com\/helps\/\",\"name\":\"\u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3\",\"description\":\"\u9999\u6e2f\u670d\u52a1\u5668_\u9999\u6e2f\u4e91\u670d\u52a1\u5668\u8d44\u8baf_\u670d\u52a1\u5668\u5e2e\u52a9\u6587\u6863_\u670d\u52a1\u5668\u6559\u7a0b\",\"potentialAction\":[{\"@type\":\"SearchAction\",\"target\":{\"@type\":\"EntryPoint\",\"urlTemplate\":\"https:\/\/www.wsisp.com\/helps\/?s={search_term_string}\"},\"query-input\":\"required name=search_term_string\"}],\"inLanguage\":\"zh-Hans\"},{\"@type\":\"Person\",\"@id\":\"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/358e386c577a3ab51c4493330a20ad41\",\"name\":\"admin\",\"image\":{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/image\/\",\"url\":\"https:\/\/gravatar.wp-china-yes.net\/avatar\/?s=96&d=mystery\",\"contentUrl\":\"https:\/\/gravatar.wp-china-yes.net\/avatar\/?s=96&d=mystery\",\"caption\":\"admin\"},\"sameAs\":[\"http:\/\/wp.wsisp.com\"],\"url\":\"https:\/\/www.wsisp.com\/helps\/author\/admin\"}]}<\/script>\n<!-- \/ Yoast SEO plugin. -->","yoast_head_json":{"title":"\u767e\u5ea6ocr\u7684\u7b80\u5355\u5c01\u88c5 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/www.wsisp.com\/helps\/44653.html","og_locale":"zh_CN","og_type":"article","og_title":"\u767e\u5ea6ocr\u7684\u7b80\u5355\u5c01\u88c5 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3","og_description":"\u6587\u7ae0\u6d4f\u89c8\u9605\u8bfb1.7k\u6b21\u3002\u672c\u6587\u4ecb\u7ecd\u4e86\u767e\u5ea6OCR API\u7684\u4e24\u79cdPython\u5c01\u88c5\u5b9e\u73b0\u3002\u7b2c\u4e00\u90e8\u5206\u5c01\u88c5\u4e86\u767e\u5ea6\u901a\u7528OCR\u529f\u80fd\uff0c\u63d0\u4f9b\u4e86\u591a\u79cd\u8bc6\u522b\u7c7b\u578b\u9009\u9879\uff08\u6807\u51c6\/\u9ad8\u7cbe\u5ea6\u7248\u3001\u542b\u4f4d\u7f6e\u4fe1\u606f\u7248\u3001\u529e\u516c\u6587\u6863\u3001\u7f51\u7edc\u56fe\u7247\u3001\u624b\u5199\u6587\u5b57\u7b49\uff09\uff0c\u652f\u6301\u56fe\u7247\/URL\/PDF\u6587\u4ef6\u8f93\u5165\uff0c\u5305\u542baccess_token\u751f\u6210\u3001\u53c2\u6570\u68c0\u67e5\u7b49\u8f85\u52a9\u529f\u80fd\u3002\u7b2c\u4e8c\u90e8\u5206\u7b80\u8981\u63d0\u53ca\u4e86\u767e\u5ea6\u5361\u7247\u8bc6\u522bOCR\u7684\u5b9e\u73b0\uff0c\u540c\u6837\u57fa\u4e8ePython\u5c01\u88c5\uff0c\u4f46\u4ee3\u7801\u672a\u5b8c\u6574\u5c55\u793a\u3002\u4e24\u79cd\u5c01\u88c5\u90fd\u91c7\u7528\u9762\u5411\u5bf9\u8c61\u8bbe\u8ba1\uff0c\u901a\u8fc7\u679a\u4e3e\u7c7b\u578b\u7ba1\u7406\u4e0d\u540cOCR\u63a5\u53e3\uff0c\u9002\u7528\u4e8e\u9700\u8981\u6587\u5b57\u8bc6\u522b\u7684\u81ea\u52a8\u5316\u573a\u666f\u3002_\u767e\u5ea6ocr","og_url":"https:\/\/www.wsisp.com\/helps\/44653.html","og_site_name":"\u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3","article_published_time":"2025-06-19T23:32:03+00:00","author":"admin","twitter_card":"summary_large_image","twitter_misc":{"\u4f5c\u8005":"admin","\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4":"6 \u5206"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"WebPage","@id":"https:\/\/www.wsisp.com\/helps\/44653.html","url":"https:\/\/www.wsisp.com\/helps\/44653.html","name":"\u767e\u5ea6ocr\u7684\u7b80\u5355\u5c01\u88c5 - \u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3","isPartOf":{"@id":"https:\/\/www.wsisp.com\/helps\/#website"},"datePublished":"2025-06-19T23:32:03+00:00","dateModified":"2025-06-19T23:32:03+00:00","author":{"@id":"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/358e386c577a3ab51c4493330a20ad41"},"breadcrumb":{"@id":"https:\/\/www.wsisp.com\/helps\/44653.html#breadcrumb"},"inLanguage":"zh-Hans","potentialAction":[{"@type":"ReadAction","target":["https:\/\/www.wsisp.com\/helps\/44653.html"]}]},{"@type":"BreadcrumbList","@id":"https:\/\/www.wsisp.com\/helps\/44653.html#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"\u9996\u9875","item":"https:\/\/www.wsisp.com\/helps"},{"@type":"ListItem","position":2,"name":"\u767e\u5ea6ocr\u7684\u7b80\u5355\u5c01\u88c5"}]},{"@type":"WebSite","@id":"https:\/\/www.wsisp.com\/helps\/#website","url":"https:\/\/www.wsisp.com\/helps\/","name":"\u7f51\u7855\u4e92\u8054\u5e2e\u52a9\u4e2d\u5fc3","description":"\u9999\u6e2f\u670d\u52a1\u5668_\u9999\u6e2f\u4e91\u670d\u52a1\u5668\u8d44\u8baf_\u670d\u52a1\u5668\u5e2e\u52a9\u6587\u6863_\u670d\u52a1\u5668\u6559\u7a0b","potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/www.wsisp.com\/helps\/?s={search_term_string}"},"query-input":"required name=search_term_string"}],"inLanguage":"zh-Hans"},{"@type":"Person","@id":"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/358e386c577a3ab51c4493330a20ad41","name":"admin","image":{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"https:\/\/www.wsisp.com\/helps\/#\/schema\/person\/image\/","url":"https:\/\/gravatar.wp-china-yes.net\/avatar\/?s=96&d=mystery","contentUrl":"https:\/\/gravatar.wp-china-yes.net\/avatar\/?s=96&d=mystery","caption":"admin"},"sameAs":["http:\/\/wp.wsisp.com"],"url":"https:\/\/www.wsisp.com\/helps\/author\/admin"}]}},"_links":{"self":[{"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/posts\/44653","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/users\/2"}],"replies":[{"embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/comments?post=44653"}],"version-history":[{"count":0,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/posts\/44653\/revisions"}],"wp:attachment":[{"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/media?parent=44653"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/categories?post=44653"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/tags?post=44653"},{"taxonomy":"topic","embeddable":true,"href":"https:\/\/www.wsisp.com\/helps\/wp-json\/wp\/v2\/topic?post=44653"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}