297.html 38 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682
  1. <!DOCTYPE html>
  2. <html lang="en" data-default-color-scheme=auto>
  3. <head><!-- hexo injector head_begin start -->
  4. <script async src="https://analytics.umami.is/script.js" data-website-id="e59ec28a-c9a7-4104-9e62-a9f7eb3fac0b"></script>
  5. <!-- hexo injector head_begin end -->
  6. <meta charset="UTF-8">
  7. <link rel="apple-touch-icon" sizes="76x76" href="https://img.limour.top/2023/08/29/64ee07361815a.webp">
  8. <link rel="icon" href="https://img.limour.top/2023/08/29/64ee07361815a.webp">
  9. <meta name="viewport" content="width=device-width, initial-scale=1.0, maximum-scale=5.0, shrink-to-fit=no">
  10. <meta http-equiv="x-ua-compatible" content="ie=edge">
  11. <meta name="theme-color" content="#2f4154">
  12. <meta name="author" content="Limour">
  13. <meta name="keywords" content="">
  14. <meta name="description" content="pytesseract测试：用 tesseract 识别验证码图片，并与百度OCR的识别结果进行对比。">
  15. <meta property="og:type" content="article">
  16. <meta property="og:title" content="pytesseract测试">
  17. <meta property="og:url" content="https://b.limour.top/297.html">
  18. <meta property="og:site_name" content="Limour&#39;s Blog">
  19. <meta property="og:description" content="pytesseract测试：用 tesseract 识别验证码图片，并与百度OCR的识别结果进行对比。">
  20. <meta property="og:locale" content="en_US">
  21. <meta property="og:image" content="https://img-cdn.limour.top/blog_wp/2020/07/%E5%BE%AE%E4%BF%A1%E5%9B%BE%E7%89%87_20200702203134.png">
  22. <meta property="article:published_time" content="2020-07-02T11:37:35.000Z">
  23. <meta property="article:modified_time" content="2023-09-01T13:32:00.433Z">
  24. <meta property="article:author" content="Limour">
  25. <meta property="article:tag" content="Python">
  26. <meta property="article:tag" content="tesseract">
  27. <meta property="article:tag" content="Captcha">
  28. <meta property="article:tag" content="OCR">
  29. <meta name="twitter:card" content="summary_large_image">
  30. <meta name="twitter:image" content="https://img-cdn.limour.top/blog_wp/2020/07/%E5%BE%AE%E4%BF%A1%E5%9B%BE%E7%89%87_20200702203134.png">
  31. <title>pytesseract测试 - Limour&#39;s Blog</title>
  32. <link rel="stylesheet" href="https://jscdn.limour.top/npm/bootstrap@4.6.1/dist/css/bootstrap.min.css" />
  33. <link rel="stylesheet" href="https://jscdn.limour.top/npm/github-markdown-css@4.0.0/github-markdown.min.css" />
  34. <link rel="stylesheet" href="https://jscdn.limour.top/npm/hint.css@2.7.0/hint.min.css" />
  35. <link rel="stylesheet" href="https://lib.baomitu.com/fancybox/3.5.7/jquery.fancybox.min.css" />
  36. <!-- 主题依赖的图标库,不要自行修改 -->
  37. <!-- Do not modify the link that theme dependent icons -->
  38. <link rel="stylesheet" href="//at.alicdn.com/t/font_1749284_hj8rtnfg7um.css">
  39. <link rel="stylesheet" href="//at.alicdn.com/t/font_1736178_lbnruvf0jn.css">
  40. <link rel="stylesheet" href="/css/main.css" />
  41. <link id="highlight-css" rel="stylesheet" href="/css/highlight.css" />
  42. <link id="highlight-css-dark" rel="stylesheet" href="/css/highlight-dark.css" />
  43. <link rel="stylesheet" href="/theme-inject/custom.css">
  44. <script id="fluid-configs">
  45. var Fluid = window.Fluid || {}; // Theme bootstrap: reuse an existing global Fluid object, otherwise start from an empty one
  46. Fluid.ctx = Object.assign({}, Fluid.ctx) // shallow copy, so ctx is always an object even when none was set before
  47. var CONFIG = {"hostname":"b.limour.top","root":"/","version":"1.9.5-a","typing":{"enable":true,"typeSpeed":70,"cursorChar":"_","loop":false,"scope":[]},"anchorjs":{"enable":true,"element":"h1,h2,h3,h4,h5,h6","placement":"left","visible":"hover","icon":"§"},"progressbar":{"enable":true,"height_px":3,"color":"#29d","options":{"showSpinner":false,"trickleSpeed":100}},"code_language":{"enable":true,"default":"TEXT"},"copy_btn":true,"image_caption":{"enable":true},"image_zoom":{"enable":true,"img_url_replace":["",""]},"toc":{"enable":true,"placement":"right","headingSelector":"h1,h2,h3,h4,h5,h6","collapseDepth":0},"lazyload":{"enable":true,"loading_img":"https://jscdn.limour.top/gh/Limour-dev/Sakurairo_Vision/load_svg/inload.svg","onlypost":false,"offset_factor":2},"web_analytics":{"enable":false,"follow_dnt":true,"baidu":null,"google":{"measurement_id":null},"tencent":{"sid":null,"cid":null},"woyaola":null,"cnzz":null,"leancloud":{"app_id":null,"app_key":null,"server_url":null,"path":"window.location.pathname","ignore_local":false}},"search_path":"/local-search.xml","include_content_in_search":true}; // site/theme settings literal; NOTE(review): presumably read by the scripts loaded after this one - confirm
  48. if (CONFIG.web_analytics.follow_dnt) { // only inspect Do Not Track when the config asks for it
  49. var dntVal = navigator.doNotTrack || window.doNotTrack || navigator.msDoNotTrack; // first truthy value among the three properties
  50. Fluid.ctx.dnt = dntVal && (dntVal.startsWith('1') || dntVal.startsWith('yes') || dntVal.startsWith('on')); // true when the value starts with '1', 'yes' or 'on'; stays falsy when no value was found
  51. }
  52. </script>
  53. <script src="/js/utils.js" ></script>
  54. <script src="/js/color-schema.js" ></script>
  55. <meta name="generator" content="Hexo 6.3.0"></head>
  56. <body>
  57. <header>
  58. <div class="header-inner" style="height: 70vh;">
  59. <nav id="navbar" class="navbar fixed-top navbar-expand-lg navbar-dark scrolling-navbar">
  60. <div class="container">
  61. <a class="navbar-brand" href="/">
  62. <strong>Limour&#39;s Blog</strong>
  63. </a>
  64. <button id="navbar-toggler-btn" class="navbar-toggler" type="button" data-toggle="collapse"
  65. data-target="#navbarSupportedContent"
  66. aria-controls="navbarSupportedContent" aria-expanded="false" aria-label="Toggle navigation">
  67. <div class="animated-icon"><span></span><span></span><span></span></div>
  68. </button>
  69. <!-- Collapsible content -->
  70. <div class="collapse navbar-collapse" id="navbarSupportedContent">
  71. <ul class="navbar-nav ml-auto text-center">
  72. <li class="nav-item">
  73. <a class="nav-link" href="/">
  74. <i class="iconfont icon-home-fill"></i>
  75. <span>Home</span>
  76. </a>
  77. </li>
  78. <li class="nav-item">
  79. <a class="nav-link" href="/archives/">
  80. <i class="iconfont icon-archive-fill"></i>
  81. <span>Archives</span>
  82. </a>
  83. </li>
  84. <li class="nav-item" id="search-btn">
  85. <a class="nav-link" target="_self" href="javascript:;" data-toggle="modal" data-target="#modalSearch" aria-label="Search">
  86. <i class="iconfont icon-search"></i>
  87. </a>
  88. </li>
  89. <li class="nav-item" id="color-toggle-btn">
  90. <a class="nav-link" target="_self" href="javascript:;" aria-label="Color Toggle">
  91. <i class="iconfont icon-dark" id="color-toggle-icon"></i>
  92. </a>
  93. </li>
  94. </ul>
  95. </div>
  96. </div>
  97. </nav>
  98. <div id="banner" class="banner" parallax=true
  99. style="background: url('https://img.limour.top/2023/08/29/64ee08e108638.webp') no-repeat center center; background-size: cover;">
  100. <div class="full-bg-img">
  101. <div class="mask flex-center" style="background-color: rgba(0, 0, 0, 0.3)">
  102. <div class="banner-text text-center fade-in-up">
  103. <div class="h2">
  104. <span id="subtitle" data-typed-text="pytesseract测试"></span>
  105. </div>
  106. <div class="mt-3">
  107. <span class="post-meta">
  108. <i class="iconfont icon-date-fill" aria-hidden="true"></i>
  109. <time datetime="2020-07-02 19:37" pubdate>
  110. July 2, 2020 pm
  111. </time>
  112. </span>
  113. </div>
  114. <div class="mt-1">
  115. <span class="post-meta mr-2">
  116. <i class="iconfont icon-chart"></i>
  117. 2.8k words
  118. </span>
  119. <span class="post-meta mr-2">
  120. <i class="iconfont icon-clock-fill"></i>
  121. 24 mins
  122. </span>
  123. </div>
  124. </div>
  125. </div>
  126. </div>
  127. </div>
  128. </div>
  129. </header>
  130. <main>
  131. <div class="container-fluid nopadding-x">
  132. <div class="row nomargin-x">
  133. <div class="side-col d-none d-lg-block col-lg-2">
  134. </div>
  135. <div class="col-lg-8 nopadding-x-md">
  136. <div class="container nopadding-x-md" id="board-ctn">
  137. <div id="board">
  138. <article class="post-content mx-auto">
  139. <h1 id="seo-header">pytesseract测试</h1>
  140. <div class="markdown-body">
  141. <figure class="highlight python"><table><tr><td class="gutter"><pre><span class="line">1</span><br><span class="line">2</span><br><span class="line">3</span><br><span class="line">4</span><br><span class="line">5</span><br><span class="line">6</span><br><span class="line">7</span><br><span class="line">8</span><br><span class="line">9</span><br><span class="line">10</span><br><span class="line">11</span><br><span class="line">12</span><br><span class="line">13</span><br><span class="line">14</span><br><span class="line">15</span><br><span class="line">16</span><br><span class="line">17</span><br><span class="line">18</span><br><span class="line">19</span><br><span class="line">20</span><br><span class="line">21</span><br><span class="line">22</span><br><span class="line">23</span><br><span class="line">24</span><br><span class="line">25</span><br><span class="line">26</span><br><span class="line">27</span><br><span class="line">28</span><br><span class="line">29</span><br><span class="line">30</span><br><span class="line">31</span><br><span class="line">32</span><br><span class="line">33</span><br><span class="line">34</span><br><span class="line">35</span><br><span class="line">36</span><br></pre></td><td class="code"><pre><code class="hljs python"><span class="hljs-keyword">from</span> PIL <span class="hljs-keyword">import</span> Image<br><span class="hljs-comment">#from itertools import cycle</span><br><span class="hljs-keyword">import</span> os, random<br><span class="hljs-keyword">import</span> pytesseract<br>config = <span class="hljs-string">&quot;--psm 8 --oem 0 -c tessedit_char_whitelist=abcdefghijklmnopqrstuvwxyz&quot;</span><br><span class="hljs-keyword">def</span> <span class="hljs-title function_">tesOCR</span>(<span class="hljs-params">img</span>):<br> <span class="hljs-keyword">return</span> pytesseract.image_to_string(img, lang=<span class="hljs-string">&#x27;eng&#x27;</span>, config=config)<br><br><br><span class="hljs-keyword">class</span> 
<span class="hljs-title class_">Fileset</span>(<span class="hljs-title class_ inherited__">list</span>):<br> <span class="hljs-keyword">def</span> <span class="hljs-title function_">__init__</span>(<span class="hljs-params">self, name, ext=<span class="hljs-string">&#x27;&#x27;</span>, _read=<span class="hljs-literal">None</span>, root=<span class="hljs-literal">None</span></span>):<br> <span class="hljs-keyword">if</span> <span class="hljs-built_in">isinstance</span>(name, <span class="hljs-built_in">str</span>) :<br> self.root = os.path.join(root <span class="hljs-keyword">or</span> os.getcwd(), name)<br> self.extend(f <span class="hljs-keyword">for</span> f <span class="hljs-keyword">in</span> os.listdir(self.root) <span class="hljs-keyword">if</span> f.endswith(ext))<br> self._read = _read<br> <span class="hljs-keyword">def</span> <span class="hljs-title function_">__getitem__</span>(<span class="hljs-params">self, index</span>):<br> <span class="hljs-keyword">if</span> <span class="hljs-built_in">isinstance</span>(index, <span class="hljs-built_in">int</span>):<span class="hljs-comment"># index是索引</span><br> <span class="hljs-keyword">return</span> os.path.join(self.root, <span class="hljs-built_in">super</span>().__getitem__(index))<br> <span class="hljs-keyword">else</span>:<span class="hljs-comment"># index是切片</span><br> fileset = Fileset(<span class="hljs-literal">None</span>)<br> fileset.root = self.root<br> fileset._read = self._read<br> fileset.extend(<span class="hljs-built_in">super</span>().__getitem__(index))<br> <span class="hljs-keyword">return</span> fileset<br> <span class="hljs-keyword">def</span> <span class="hljs-title function_">getFileName</span>(<span class="hljs-params">self, index</span>):<br> fname, ext = os.path.splitext(<span class="hljs-built_in">super</span>().__getitem__(index))<br> <span class="hljs-keyword">return</span> fname<br> <span class="hljs-keyword">def</span> <span class="hljs-title function_">__iter__</span>(<span 
class="hljs-params">self</span>):<br> <span class="hljs-keyword">return</span> (os.path.join(self.root, f) <span class="hljs-keyword">for</span> f <span class="hljs-keyword">in</span> <span class="hljs-built_in">super</span>().__iter__())<br> <span class="hljs-keyword">def</span> <span class="hljs-title function_">__call__</span>(<span class="hljs-params">self</span>):<br> retn = random.choice(self)<br> <span class="hljs-keyword">if</span> self._read: <span class="hljs-keyword">return</span> self._read(retn)<br> <span class="hljs-keyword">else</span>: <span class="hljs-keyword">return</span> retn<br><br>sample = Fileset(<span class="hljs-string">&#x27;Captcha&#x27;</span>, <span class="hljs-string">&#x27;.jpg&#x27;</span>, Image.<span class="hljs-built_in">open</span>)<br><br></code></pre></td></tr></table></figure>
  142. <p><a target="_blank" rel="noopener" href="https://limour.lanzous.com/iqHJfdxripg"><img src="data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAL4AAAC+CAYAAACLdLWdAAAPfUlEQVR4Xu2dUXbbOhJEJytzlp6dZQ4t+lGm2MQtFEBJTs3vNIBG9UWxAcd+vz4+Pv7+70X+9+fPHyuT379/P4w/mvMoTlmYzkn34+RdrUH36OyF5r1oS/NR6uDE/gr4unwOLEerUYBonAKas5cZ+ejV6BsR8Dt0c2AJ+B2CTxgS8DtEDfg30eL4HfAcDaE9cbUcLYTbbwb8Hwq+CyA5BxRSMtdXjDOnM1ZxP+fQKXVx9uOMdU1JqTeJrfQ+bHUUgcniTl+rzO8UzBkb8NtVcvVtr3AcEfAbyrmFoePj+FshnmWwSwZx/LUOFFz3Ux7wA/4DQ64DOPA6Y9PqtBsRV9/2CpNandFO9SwhKkiVVyaqhXOQ3TWovnQdRR/nTjc6H7vHvyIhBxTFEeheZvxzAJrnjBzpMyzNUanXsw5iwL+r5gyoXEfcj5+RY8DfVMaXW1oICgB1AOo+ShzdSxz/XNU4foM66jSKkAroV7gpPfA07xmHk9aB5qjUixod3TfV+8e1Os8S0n3OHH3xuwo+ZZ3Re3QOYsCn6t3FKcWmB3E0FDNydPbiGkMcvwEqLc5oId3CBvxNgStarzh+HB//M2JqKoqkdM7RRhXwlSqtsTPaiDh+HP+BAeX5UIGyg/nTIY4r0dcImvPoXOi6S5xSgzj+qiwVYglXYpXC9caOhk0BaJ/z6FwUTZS8aQ2d/Sh3hrf4ARYVTSmaE+sUJ46fVietTsddIo5fW1Yc37FzMDaOfxPpn2h1AA9SyDPbFwquUlj6WkNbnVfTZ4YW7pwEOPs5kyyixLxaYSmQ7h7pOq+mjwvps/YT8O+Ii+OfH98ZkM6Yk5hQwA/4hJPPmBmQzpiTbCjgB3zCyb8NPlZocKD7k1vqKk5c9ZrhzEmf4Wjcq+VYfUUG4yNN9xZ/OzNQ1c+H1aecHpIr4gJ+40zG8TeBnMMex2+bfxx/1Yg636tBFcdvQ34UEfAD/gMXztdG+Wr3ITtm1K+/f/++zH8KqNrSVe/uVFInH2fsUX6K4yvjqRb7OPcHXb3rquMCvqqY8N9zUtqnXoACfkcBlz8aG8fXhXNc2xmrODZ1XpoPVYmuS+ebFRfwO5SlsMTxO8S9aEjA7xA64NeixfE7gMrldlOAApQevw807PiOyym9Kd2GAwZtQZSnOXdOum8njtaQrkH3XM1Hx9Na07yXuIC/qkXfrpdwGkvjlII5sQF/Uy/gB/zus0QdO45/p4DrPvTzR12XxsXxz+8hSl3pwaG1Vk5wHD+Or/DyLZaC++Mcn55E6qaKWxyJ6RaCEkD3TS/1NG8at6xLc3RqQ9dQXuuUPe7nVfKxHJ8u5IhLYayK7R4mesBono4WChRX1IauEfDvFFCKSKGaMWfAvylADyytlTInNS/lIMbxlUqtsYrA++kpQE5cWp12UQN+W6OHiIB/k8TR4cc5vutUtLVw1qEFU/45gJMP3TO9LCtQ0ryVtUfvx6lXNXa441Mhad+mXFppj+8IOSOf0aAE/E3RgN+4WCuO5hwweuBnHE66R3ft0QfZySfgB/zD2wz9QtNDU12ZZsDb+3CwjEurc3K5TY9/fvOnX69ntl6l4398fEz/ZXN62iuZFYE7HmnkIbTVoRNTfRx3rl5RnBxn5DNa22p/l/x5EVrYgK87rKKtYyAUSDcfug49sAHfVapxRxgNFe2pXdCoLBRINx+6Ds074LtKBfwHBdPqNKBSXIA63UCO5alGuxLVZwZodPN0z3Qv1Z2DrkPzlhyfLk436bQB7gZpjso6FEAnjubj7u/VauNoRrldtLX+O7dU9FcTl0KlXLap6DSO5khroOyFru3GUS
1GxwX8zspd5UokvYC/qUQPSMAnZB3EBPxO4XbDKKij4wJ+Z/0CfqdwrwQ+/aOxtE93P71UUgqfM181drQDUc2UPdN6UX1oXLUXJx+qN83x0/ED/k0upTC0EE7cURED/qaKUq8jLQP+qooipAO0Au++YMpYZT+KU7Zi4/gthcz/X4GALKWAEvBrRQM+oc2ICfg38WaAZpRlSj7UaJS8cavj9pzks61cJukm6QFRHJ+ufRRHi+jEOfm5YxUdnT3SdSpjCPgdPb4Dx+hi0xchJ2dlLAWy+lqNNqqAf1c9Cp9ScBpL13biaC4z4gJ+Q1VXIFq00Q5C11XaNifHOP55ReL4cXz3zKLxrqE5JkDvVEtcevz0+AhoGvTjwKcbcnpTukZ1MaIvT4oz0II7ccq+9+sorQ51U6qjsjad06mNoiN2fDppwNePANXWgWIZG/A3BQP+qoXrXjru24iA33dB3Y9SdAz4AR+dWedrUS1AQaWmROeTLrd00rQ6iKNvQVTbtDrn2io6Wn9Qip5EerFx5qt6WAcWRUjnwOtHpW8E3c+r7WV03p+O7/wJQQfUn/bpfDVYqNlQY5hRL3p8A35DKUcgB5RlbMCnGOtxTl2rsXH8kzpQwQO+DrMygtaBmk9anUFfkICvYKzHTgH/6HduaT9H4+hWqw3Sk0zvHDRvKni1Pycfp/d286FtH92f+/BA60Xz/nT8gH+Tix4ueoirOZXi7GPdHBVQ92s78AX8ztaCFpwWlhYxjr8VjGpWlZhqeUWt4/h3VaKCx/E3BajRxPHj+IcKjHbD9PjnX6pPx7/iB1i0sErB6JzUlWZ8yunatO935lO+VDQfZU6aO60DrX+VY8BflaGCKz0sLTYFzZlPgZTmo8xJc6d1CPgN9UcLHvAV3PX7QMAfdPEM+H2g7ke5Dju6Dm4+aXXS6qCT4YL2cuDTH2AhdYogZ9PLlHT8jN6U7tt5DqVjaZzySEA1c2pANVzi6AFztcA/uVWS38dS0ZR/skDzoULS+RSo6Nq0iDROyTHg3ylAC0ZhCfjnSlGgaVzAb5MZx29rhCIcKOlYGhfw2yUL+G2NUIQDJR1L4wJ+u2QW+LQQTly1Bee9d0Y+balvEbSNpO0hXVdZ+2jOqzRz9KFMLPsL+GuVFdEU2PaxTmGddQP+d/UCfsBH5ymOfyeTI4brsHT86DhEyUlQHP9cQUcfWuu0Onc1UERz4HcK66ybVqez1aGXrRkAjYaFzqeARr9+9OKorH0UO6MObk7kvuNwpmiLe3wnITq2EpaCSteh8ymFDviKWrdY53DSGlZMBHy9XocjAr4uZMBvaOaebvKJ1cv2fUTA1xUM+AFfp6ZDM9oKDk+mmPCp4I/+nVvqzleJSy88M/KmXwEnTrkXUfAdIN260rVpXJXP8F9EmQGQK+Z+PAXNXZeu48QF/E0BerCXEQF/1W3GgXWAdh3NGe+Mdc2Crk3j4vh3ClAg3SLSdZy4OH4cH3NKQcMTFoF0HScu4Ad8zCkFDU8Y8F2p/htPWxgaJ7U6FAwn7ighpc+mFxlXIJonzYfON+M1itZrGMWNiahmlAs6X3m5pQI5cQ4Ay1i6yYB/3gpQqGYcBqeG1Bji+I3LrVLY0YeJwkeNptqLO17RiMQG/FUlCkAcf8PK1UwZT2BWYgJ+wEe8uI7tjkdJCkFPBf/oL6kJuaNQ11VowaiQz7xfIMHMO4zS6tB83DiXAXf9/fjDf5Y8ehF30wG/roiirWMMLhNKnu5aZHzAv7jNIkVx7zBx/LbKAT/gtykZEBHH7xAxrU5anQ5sTodYv3ronGIKs/vZpjm6+RzlSeekvbfy8wMaS+NmPAg4taEHoVoj4K8KUkip4FWfPhq06tDQdWhcwL9TgJ5Yxw3j+JsCCqQ0lsYF/ICPTZ9+RdLqnEtK9VEOZ1qdtDoPvFDQlC8+NQHaHVD3mdLj08WVk3jFxmkRlP6Z5q3AQvSlkC5zjV6b7pnsY0SM0rZZju8kqxRBKe
4+JyoGjVMAogfM0VHRRtG8Nycln941qnFKDQP+qqIiGgUo4I9G+3w+pYYBP+APpTOO35CTuuYyjSMmdQEal1Zn3guMewKVGh7+XZ3Rn2gHXEUMZePkLlCtTfW5Iu4qfa56oLiqhgH/pNUJ+HpPrWhGDxM1TqWLCPgBX/lofItVQHPgdcZWmwv4AT/gfylAe1OqGD2xdL4R77jp8W8KOLV5a8env3N7xaVDKcIV+SgH8Vlm4cJHdVTWUXQjsVRbhR/8G1hUIHphOYpTEr8iH1KUZ38lFSAdgJR1FN1IrJN32ePH8Yn07RhanPZMWguiAElzpHF0L24czUcxzji+W5V1PC0OXY4WMeBvilLNlhEBn5LYiAv4g4Q8mIZqOwX8edtqz0z7eRrn3EOqbKnoikPv16IAtBXtc8n9vI7eVY5X6YMdXxFzdCwVmMYF/IAf8FcGHKdZpojja5fyOD74PFAnp3Fx/Dh+HD+OD6znOMQxmjg+kJ0KTOPi+HF8679zC5iVQqo+2em/6UsIjav6eZqjcxe4KsejotG1lRrSOZ18KgAD/qqMUgQlljxJ0i+Qsq4SS9yJzhfwiZq7GEU0Or1TsMrF6ZzUqQL+poDz5aRjl9Xi+HF85CH0sCvmReekBhLw75Si4tK49Pjn7vzW4NMLGLKKIsh5gVmmdMbTsa/W6ih604NMa03dlM7nPme66+BfPVREJ7EUPkUgKgZdO+CP6b0JD18xVx2wgP9GPb4CUBz/XK2AH/DRebrKia9aJ+AH/ID/pQD9TCLFin+5SPtst8d3HISOrXIcfeeg7/3VyxOtF62Nqw/Nhz5nKvpgx3c2SQ8SBUV51aF50xyVYtH9UNCUwtK16Zwz9FG03MfS/VX1D/gdrQ4tmFMcZ2wcv/0aFfAD/sM5pl8g+jWlRqHEucYQ8AN+wH/Vy63jLNQZaK/rXmSpqzl7Vlodug7t8Wf8kwWnhpXeb+H4tDjO7T/gnx/JgE8t6y5uhmg0DcctlAPnrOMeOufA0z3OqKE7J2XgKC6Of6IehUJpLWixlLUDPlV1iwv4AR9R47qz81I0+mu6bPhHge8UhxZmEU2J3VPljFVaIgqL+2XZ56RcbtGJK4KcWgf8O1EVIJXYgH9T4IoDptQljr+SqYimxAb8gP+NAQUe6hbO58/Nx2kt6Ni0OpsCTq3T6qTVuaQFeetWx7mIUKdynK/KT3Fy0pYsMTRP+qUara07H90frWuVD3Vtuh8lb9zj08VpnAMkXaNyGipQBa47Xsn/GbF0fwG/ozoBv0O0i4YE/IlCB/yJ4ppTB3xTwLPhAX+iuObU/yz4pm7dwx3B3X7+qn7V3SMVd/TF2s17tNG5+3uLv53pFNspmCIufaFw8qE6VCagjN/HunkH/BP131ncgH9+rAJ+wHeMF49VvlZk0nc2paP9pdU5qboCTxw/jk8M5DDmnV0l4L8X+P8H+o8XEfNPBksAAAAASUVORK5CYII=" srcset="https://jscdn.limour.top/gh/Limour-dev/Sakurairo_Vision/load_svg/inload.svg" lazyload></a></p>
  143. <p>测试用验证码文件</p>
  144. <p><img src="https://img-cdn.limour.top/blog_wp/2020/07/%E5%BE%AE%E4%BF%A1%E5%9B%BE%E7%89%87_20200702203134.png" srcset="https://jscdn.limour.top/gh/Limour-dev/Sakurairo_Vision/load_svg/inload.svg" lazyload></p>
  145. <p>与百度OCR的对比,第一个是tesseractOCR</p>
  146. <figure class="highlight python"><table><tr><td class="gutter"><pre><span class="line">1</span><br><span class="line">2</span><br><span class="line">3</span><br><span class="line">4</span><br><span class="line">5</span><br><span class="line">6</span><br><span class="line">7</span><br></pre></td><td class="code"><pre><code class="hljs python"><span class="hljs-comment">#tesOCR.py</span><br><span class="hljs-keyword">from</span> PIL <span class="hljs-keyword">import</span> Image<br><span class="hljs-keyword">import</span> pytesseract<br><span class="hljs-keyword">from</span> io <span class="hljs-keyword">import</span> BytesIO<br><br>config = <span class="hljs-string">&quot;--psm 8 --oem 0 -c tessedit_char_whitelist=abcdefghijklmnopqrstuvwxyz&quot;</span><br><br></code></pre></td></tr></table></figure>
  147. <figure class="highlight python"><table><tr><td class="gutter"><pre><span class="line">1</span><br><span class="line">2</span><br><span class="line">3</span><br><span class="line">4</span><br><span class="line">5</span><br><span class="line">6</span><br><span class="line">7</span><br><span class="line">8</span><br><span class="line">9</span><br><span class="line">10</span><br><span class="line">11</span><br><span class="line">12</span><br><span class="line">13</span><br></pre></td><td class="code"><pre><code class="hljs python"><span class="hljs-comment">#baiduOCR.py</span><br><span class="hljs-keyword">from</span> aip <span class="hljs-keyword">import</span> AipOcr<br><span class="hljs-string">&quot;&quot;&quot; 你的 APPID AK SK &quot;&quot;&quot;</span><br>APP_ID = <span class="hljs-string">&#x27;&#x27;</span><br>API_KEY = <span class="hljs-string">&#x27;&#x27;</span><br>SECRET_KEY = <span class="hljs-string">&#x27;&#x27;</span><br><br>client = AipOcr(APP_ID, API_KEY, SECRET_KEY)<br>options = &#123;&#125;<br>options[<span class="hljs-string">&quot;language_type&quot;</span>] = <span class="hljs-string">&quot;ENG&quot;</span><br>options[<span class="hljs-string">&quot;detect_direction&quot;</span>] = <span class="hljs-string">&quot;true&quot;</span><br>options[<span class="hljs-string">&quot;detect_language&quot;</span>] = <span class="hljs-string">&quot;true&quot;</span><br><br></code></pre></td></tr></table></figure>
  148. <figure class="highlight python"><table><tr><td class="gutter"><pre><span class="line">1</span><br><span class="line">2</span><br><span class="line">3</span><br><span class="line">4</span><br><span class="line">5</span><br><span class="line">6</span><br><span class="line">7</span><br><span class="line">8</span><br><span class="line">9</span><br><span class="line">10</span><br><span class="line">11</span><br><span class="line">12</span><br><span class="line">13</span><br><span class="line">14</span><br><span class="line">15</span><br><span class="line">16</span><br><span class="line">17</span><br><span class="line">18</span><br><span class="line">19</span><br><span class="line">20</span><br><span class="line">21</span><br><span class="line">22</span><br><span class="line">23</span><br><span class="line">24</span><br><span class="line">25</span><br><span class="line">26</span><br><span class="line">27</span><br><span class="line">28</span><br><span class="line">29</span><br><span class="line">30</span><br><span class="line">31</span><br><span class="line">32</span><br><span class="line">33</span><br><span class="line">34</span><br><span class="line">35</span><br><span class="line">36</span><br></pre></td><td class="code"><pre><code class="hljs python"><span class="hljs-comment">#test.py</span><br><span class="hljs-keyword">import</span> os, random<br><span class="hljs-keyword">class</span> <span class="hljs-title class_">Fileset</span>(<span class="hljs-title class_ inherited__">list</span>):<br> <span class="hljs-keyword">def</span> <span class="hljs-title function_">__init__</span>(<span class="hljs-params">self, name, ext=<span class="hljs-string">&#x27;&#x27;</span>, _read=<span class="hljs-literal">None</span>, root=<span class="hljs-literal">None</span></span>):<br> <span class="hljs-keyword">if</span> <span class="hljs-built_in">isinstance</span>(name, <span class="hljs-built_in">str</span>) :<br> self.root = os.path.join(root <span 
class="hljs-keyword">or</span> os.getcwd(), name)<br> self.extend(f <span class="hljs-keyword">for</span> f <span class="hljs-keyword">in</span> os.listdir(self.root) <span class="hljs-keyword">if</span> f.endswith(ext))<br> self._read = _read<br> <span class="hljs-keyword">def</span> <span class="hljs-title function_">__getitem__</span>(<span class="hljs-params">self, index</span>):<br> <span class="hljs-keyword">if</span> <span class="hljs-built_in">isinstance</span>(index, <span class="hljs-built_in">int</span>):<span class="hljs-comment"># index是索引</span><br> <span class="hljs-keyword">return</span> os.path.join(self.root, <span class="hljs-built_in">super</span>().__getitem__(index))<br> <span class="hljs-keyword">else</span>:<span class="hljs-comment"># index是切片</span><br> fileset = Fileset(<span class="hljs-literal">None</span>)<br> fileset.root = self.root<br> fileset._read = self._read<br> fileset.extend(<span class="hljs-built_in">super</span>().__getitem__(index))<br> <span class="hljs-keyword">return</span> fileset<br> <span class="hljs-keyword">def</span> <span class="hljs-title function_">getFileName</span>(<span class="hljs-params">self, index</span>):<br> fname, ext = os.path.splitext(<span class="hljs-built_in">super</span>().__getitem__(index))<br> <span class="hljs-keyword">return</span> fname<br> <span class="hljs-keyword">def</span> <span class="hljs-title function_">__iter__</span>(<span class="hljs-params">self</span>):<br> <span class="hljs-keyword">return</span> (os.path.join(self.root, f) <span class="hljs-keyword">for</span> f <span class="hljs-keyword">in</span> <span class="hljs-built_in">super</span>().__iter__())<br> <span class="hljs-keyword">def</span> <span class="hljs-title function_">__call__</span>(<span class="hljs-params">self</span>):<br> retn = random.choice(self)<br> <span class="hljs-keyword">if</span> self._read: <span class="hljs-keyword">return</span> self._read(retn)<br> <span class="hljs-keyword">else</span>: <span 
class="hljs-keyword">return</span> retn<br><span class="hljs-keyword">def</span> <span class="hljs-title function_">fopen</span>(<span class="hljs-params">path</span>):<br> <span class="hljs-keyword">with</span> <span class="hljs-built_in">open</span>(path, <span class="hljs-string">&#x27;rb&#x27;</span>) <span class="hljs-keyword">as</span> f:<br> <span class="hljs-keyword">return</span> f.read()<br>sample = Fileset(<span class="hljs-string">&#x27;Captcha&#x27;</span>, <span class="hljs-string">&#x27;.jpg&#x27;</span>, fopen)<br><br>OCR = <span class="hljs-built_in">input</span>(<span class="hljs-string">&#x27;请选择验证码识别方式(默认为tesseract, 1为百度OCR):&#x27;</span>)<br><span class="hljs-keyword">if</span> <span class="hljs-keyword">not</span> OCR: <span class="hljs-keyword">from</span> tesOCR <span class="hljs-keyword">import</span> tesOCR <span class="hljs-keyword">as</span> OCR<br><span class="hljs-keyword">elif</span> OCR == <span class="hljs-string">&quot;1&quot;</span> : <span class="hljs-keyword">from</span> baiduOCR <span class="hljs-keyword">import</span> BaiduOCR <span class="hljs-keyword">as</span> OCR<br><span class="hljs-keyword">from</span> baiduOCR <span class="hljs-keyword">import</span> BaiduOCR<br><br></code></pre></td></tr></table></figure>
  149. </div>
  150. <hr/>
  151. <div>
  152. <div class="post-metas my-3">
  153. <div class="post-meta mr-3 d-flex align-items-center">
  154. <i class="iconfont icon-category"></i>
  155. <span class="category-chains">
  156. <span class="category-chain">
  157. <a href="/categories/Python%E7%BB%83%E4%B9%A0/" class="category-chain-item">Python练习</a>
  158. </span>
  159. </span>
  160. </div>
  161. <div class="post-meta">
  162. <i class="iconfont icon-tags"></i>
  163. <a href="/tags/Python/" class="print-no-link">#Python</a>
  164. <a href="/tags/tesseract/" class="print-no-link">#tesseract</a>
  165. <a href="/tags/Captcha/" class="print-no-link">#Captcha</a>
  166. <a href="/tags/OCR/" class="print-no-link">#OCR</a>
  167. </div>
  168. </div>
  169. <div class="license-box my-3">
  170. <div class="license-title">
  171. <div>pytesseract测试</div>
  172. <div>https://b.limour.top/297.html</div>
  173. </div>
  174. <div class="license-meta">
  175. <div class="license-meta-item">
  176. <div>Author</div>
  177. <div>Limour</div>
  178. </div>
  179. <div class="license-meta-item license-meta-date">
  180. <div>Posted on</div>
  181. <div>July 2, 2020</div>
  182. </div>
  183. <div class="license-meta-item">
  184. <div>Licensed under</div>
  185. <div>
  186. <a class="print-no-link" target="_blank" rel="noopener" href="https://creativecommons.org/licenses/by-nc-sa/4.0/">
  187. <span class="hint--top hint--rounded" aria-label="BY - Attribution">
  188. <i class="iconfont icon-by"></i>
  189. </span>
  190. </a>
  191. <a class="print-no-link" target="_blank" rel="noopener" href="https://creativecommons.org/licenses/by-nc-sa/4.0/">
  192. <span class="hint--top hint--rounded" aria-label="NC - Non-commercial">
  193. <i class="iconfont icon-nc"></i>
  194. </span>
  195. </a>
  196. <a class="print-no-link" target="_blank" rel="noopener" href="https://creativecommons.org/licenses/by-nc-sa/4.0/">
  197. <span class="hint--top hint--rounded" aria-label="SA - Share-alike">
  198. <i class="iconfont icon-sa"></i>
  199. </span>
  200. </a>
  201. </div>
  202. </div>
  203. </div>
  204. <div class="license-icon iconfont"></div>
  205. </div>
  206. <div class="post-prevnext my-3">
  207. <article class="post-prev col-6">
  208. <a href="/309.html" title="LSTM应用于验证码识别">
  209. <i class="iconfont icon-arrowleft"></i>
  210. <span class="hidden-mobile">LSTM应用于验证码识别</span>
  211. <span class="visible-mobile">Previous</span>
  212. </a>
  213. </article>
  214. <article class="post-next col-6">
  215. <a href="/288.html" title="学年总结-有机化学">
  216. <span class="hidden-mobile">学年总结-有机化学</span>
  217. <span class="visible-mobile">Next</span>
  218. <i class="iconfont icon-arrowright"></i>
  219. </a>
  220. </article>
  221. </div>
  222. </div>
  223. <article id="comments" lazyload>
  224. <div id="waline"></div>
  225. <script type="text/javascript">
  226. Fluid.utils.loadComments('#waline', function() { // Sets up the Waline comment widget in #waline. NOTE(review): loadComments is defined outside this file - presumably it defers this callback until the comment area is needed; confirm
  227. Fluid.utils.createCssLink('https://cdn.staticfile.org/waline/2.15.5/waline.min.css') // Waline 2.15.5 stylesheet
  228. Fluid.utils.createScript('https://cdn.staticfile.org/waline/2.15.5/waline.min.js', function() { // NOTE(review): callback presumably runs once the script has loaded - confirm in utils.js
  229. var options = Object.assign(
  230. {"serverURL":"https://comments.limour.top","path":"window.location.pathname","meta":["nick","mail","link"],"requiredMeta":["nick"],"lang":"zh-CN","emoji":["https://jscdn.limour.top/gh/walinejs/emojis/weibo"],"dark":"html[data-user-color-scheme=\"dark\"]","wordLimit":0,"pageSize":10}, // generated settings; "path" here is the literal string "window.location.pathname", not its value
  231. {
  232. el: '#waline',
  233. path: window.location.pathname // later Object.assign sources win, so the real pathname replaces the string above
  234. }
  235. )
  236. Waline.init(options);
  237. Fluid.utils.waitElementVisible('#waline .vcontent', () => { // NOTE(review): presumably fires once a '#waline .vcontent' element is visible - confirm in utils.js
  238. var imgSelector = '#waline .vcontent img:not(.vemoji)'; // images under #waline .vcontent, except those with class vemoji
  239. Fluid.plugins.imageCaption(imgSelector);
  240. Fluid.plugins.fancyBox(imgSelector);
  241. })
  242. });
  243. });
  244. </script>
  245. <noscript>Please enable JavaScript to view the comments</noscript>
  246. </article>
  247. </article>
  248. </div>
  249. </div>
  250. </div>
  251. <div class="side-col d-none d-lg-block col-lg-2">
  252. <aside class="sidebar" style="margin-left: -1rem">
  253. <div id="toc">
  254. <p class="toc-header">
  255. <i class="iconfont icon-list"></i>
  256. <span>Table of Contents</span>
  257. </p>
  258. <div class="toc-body" id="toc-body"></div>
  259. </div>
  260. </aside>
  261. </div>
  262. </div>
  263. </div>
  264. <a id="scroll-top-button" aria-label="TOP" href="#" role="button">
  265. <i class="iconfont icon-arrowup" aria-hidden="true"></i>
  266. </a>
  267. <div class="modal fade" id="modalSearch" tabindex="-1" role="dialog" aria-labelledby="ModalLabel"
  268. aria-hidden="true">
  269. <div class="modal-dialog modal-dialog-scrollable modal-lg" role="document">
  270. <div class="modal-content">
  271. <div class="modal-header text-center">
  272. <h4 class="modal-title w-100 font-weight-bold">Search</h4>
  273. <button type="button" id="local-search-close" class="close" data-dismiss="modal" aria-label="Close">
  274. <span aria-hidden="true">&times;</span>
  275. </button>
  276. </div>
  277. <div class="modal-body mx-3">
  278. <div class="md-form mb-5">
  279. <input type="text" id="local-search-input" class="form-control validate">
  280. <label data-error="x" data-success="v" for="local-search-input">Keyword</label>
  281. </div>
  282. <div class="list-group" id="local-search-result"></div>
  283. </div>
  284. </div>
  285. </div>
  286. </div>
  287. </main>
  288. <footer>
  289. <div class="footer-inner">
  290. <div class="footer-content"><!-- filing (beian/ICP) links, ForeverBlog badge, and Hexo/Fluid/source credits -->
  291. <a target="_blank" rel="nofollow noopener" href="http://www.beian.gov.cn/portal/registerSystemInfo?recordcode=43130202000203"><img src="https://img.limour.top/2023/08/27/64eadeb81d6a0.webp" srcset="https://jscdn.limour.top/gh/Limour-dev/Sakurairo_Vision/load_svg/inload.svg" lazyload alt="">湘公网安备 43130202000203号 </a> <a target="_blank" rel="nofollow noopener" href="https://beian.miit.gov.cn/">湘ICP备20008299号 </a> <a target="_blank" rel="nofollow noopener" href="https://icp.gov.moe/?keyword=20210128">萌ICP备20210128号</a> <br> <a href="https://www.foreverblog.cn/" target="_blank" rel="noopener"> <img src="https://img.foreverblog.cn/logo_en_default.png" srcset="https://jscdn.limour.top/gh/Limour-dev/Sakurairo_Vision/load_svg/inload.svg" lazyload alt="ForeverBlog" style="width:auto;height:24px"> </a> <br> <a href="https://hexo.io" target="_blank" rel="nofollow noopener"><span>Hexo</span></a> <i class="iconfont icon-love"></i> <a href="https://github.com/fluid-dev/hexo-theme-fluid" target="_blank" rel="nofollow noopener"><span>Fluid</span></a> <i class="iconfont icon-love"></i> <a href="https://github.com/limour-blog/archives-b" target="_blank" rel="nofollow noopener"><span>SRC</span></a>
  292. </div>
  293. </div>
  294. </footer>
  295. <!-- Scripts -->
  296. <script src="https://jscdn.limour.top/npm/nprogress@0.2.0/nprogress.min.js" ></script>
  297. <link rel="stylesheet" href="https://jscdn.limour.top/npm/nprogress@0.2.0/nprogress.min.css" />
  298. <script>
  299. NProgress.configure({"showSpinner":false,"trickleSpeed":100})
  300. NProgress.start()
  301. window.addEventListener('load', function() {
  302. NProgress.done();
  303. })
  304. </script>
  305. <script src="https://jscdn.limour.top/npm/jquery@3.6.4/dist/jquery.min.js" ></script>
  306. <script src="https://jscdn.limour.top/npm/bootstrap@4.6.1/dist/js/bootstrap.min.js" ></script>
  307. <script src="/js/events.js" ></script>
  308. <script src="/js/plugins.js" ></script>
  309. <script src="https://lib.baomitu.com/typed.js/2.0.12/typed.min.js" ></script>
  310. <script>
  311. (function (window, document) {
  312. var typing = Fluid.plugins.typing;
  313. var subtitle = document.getElementById('subtitle');
  314. if (!subtitle || !typing) {
  315. return;
  316. }
  317. var text = subtitle.getAttribute('data-typed-text');
  318. typing(text);
  319. })(window, document);
  320. </script>
  321. <script src="/js/img-lazyload.js" ></script>
  322. <script>
  323. Fluid.utils.createScript('https://jscdn.limour.top/npm/tocbot@4.20.1/dist/tocbot.min.js', function() {
  324. var toc = jQuery('#toc');
  325. if (toc.length === 0 || !window.tocbot) { return; }
  326. var boardCtn = jQuery('#board-ctn');
  327. var boardTop = boardCtn.offset().top;
  328. window.tocbot.init(Object.assign({
  329. tocSelector : '#toc-body',
  330. contentSelector : '.markdown-body',
  331. linkClass : 'tocbot-link',
  332. activeLinkClass : 'tocbot-active-link',
  333. listClass : 'tocbot-list',
  334. isCollapsedClass: 'tocbot-is-collapsed',
  335. collapsibleClass: 'tocbot-is-collapsible',
  336. scrollSmooth : true,
  337. includeTitleTags: true,
  338. headingsOffset : -boardTop,
  339. }, CONFIG.toc));
  340. if (toc.find('.toc-list-item').length > 0) {
  341. toc.css('visibility', 'visible');
  342. }
  343. Fluid.events.registerRefreshCallback(function() {
  344. if ('tocbot' in window) {
  345. tocbot.refresh();
  346. var toc = jQuery('#toc');
  347. if (toc.length === 0 || !tocbot) {
  348. return;
  349. }
  350. if (toc.find('.toc-list-item').length > 0) {
  351. toc.css('visibility', 'visible');
  352. }
  353. }
  354. });
  355. });
  356. </script>
  357. <script src=https://lib.baomitu.com/clipboard.js/2.0.11/clipboard.min.js></script>
  358. <script>Fluid.plugins.codeWidget();</script>
  359. <script>
  360. Fluid.utils.createScript('https://jscdn.limour.top/npm/anchor-js@4.3.1/anchor.min.js', function() {
  361. window.anchors.options = {
  362. placement: CONFIG.anchorjs.placement,
  363. visible : CONFIG.anchorjs.visible
  364. };
  365. if (CONFIG.anchorjs.icon) {
  366. window.anchors.options.icon = CONFIG.anchorjs.icon;
  367. }
  368. var el = (CONFIG.anchorjs.element || 'h1,h2,h3,h4,h5,h6').split(',');
  369. var res = [];
  370. for (var item of el) {
  371. res.push('.markdown-body > ' + item.trim());
  372. }
  373. if (CONFIG.anchorjs.placement === 'left') {
  374. window.anchors.options.class = 'anchorjs-link-left';
  375. }
  376. window.anchors.add(res.join(', '));
  377. Fluid.events.registerRefreshCallback(function() {
  378. if ('anchors' in window) {
  379. anchors.removeAll();
  380. var el = (CONFIG.anchorjs.element || 'h1,h2,h3,h4,h5,h6').split(',');
  381. var res = [];
  382. for (var item of el) {
  383. res.push('.markdown-body > ' + item.trim());
  384. }
  385. if (CONFIG.anchorjs.placement === 'left') {
  386. anchors.options.class = 'anchorjs-link-left';
  387. }
  388. anchors.add(res.join(', '));
  389. }
  390. });
  391. });
  392. </script>
  393. <script>
  394. Fluid.utils.createScript('https://lib.baomitu.com/fancybox/3.5.7/jquery.fancybox.min.js', function() {
  395. Fluid.plugins.fancyBox();
  396. });
  397. </script>
  398. <script>Fluid.plugins.imageCaption();</script>
  399. <script src="/js/local-search.js" ></script>
  400. <!-- 主题的启动项,将它保持在最底部 -->
  401. <!-- the boot of the theme, keep it at the bottom -->
  402. <script src="/js/boot.js" ></script>
  403. <noscript>
  404. <div class="noscript-warning">Blog works best with JavaScript enabled</div>
  405. </noscript>
  406. <!-- hexo injector body_end start -->
  407. <script defer src="/theme-inject/timeliness.js"></script>
  408. <!-- hexo injector body_end end --></body>
  409. </html>