/**
* Copyright @ 2012 Quan Nguyen
*
* Licensed under the Apache License, Version 2.0 (the "License"); you may not
* use this file except in compliance with the License. You may obtain a copy of
* the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
* License for the specific language governing permissions and limitations under
* the License.
*/
package net.sourceforge.tess4j;
import java.nio.ByteBuffer;
import java.nio.DoubleBuffer;
import java.nio.FloatBuffer;
import java.nio.IntBuffer;
import com.sun.jna.Library;
import com.sun.jna.Native;
import com.sun.jna.Pointer;
import com.sun.jna.ptr.IntByReference;
import com.sun.jna.ptr.PointerByReference;
import com.ochafik.lang.jnaerator.runtime.NativeSize;
import net.sourceforge.lept4j.Boxa;
import net.sourceforge.lept4j.Pix;
import net.sourceforge.tess4j.util.LoadLibs;
/**
* A Java wrapper for <code>Tesseract OCR 3.04 API</code> using
* <code>JNA Direct Mapping</code>.
*/
public class TessAPI1 implements Library, ITessAPI {
static {
Native.register(LoadLibs.getTesseractLibName());
}
/**
* Gets the version identifier.
* <p>
* Declared <code>native</code>; this class registers its native methods
* with the Tesseract library in its static initializer.
*
* @return the version identifier
*/
public static native String TessVersion();
/**
* Deallocates the memory block occupied by text.
* <p>
* NOTE(review): presumably meant for text buffers that the native library
* handed back as a raw {@link Pointer} - confirm against the Tesseract C
* API before passing any other pointer.
*
* @param text the pointer to the text to deallocate
*/
public static native void TessDeleteText(Pointer text);
/**
* Deallocates the memory block occupied by a text array.
* <p>
* NOTE(review): presumably meant for text arrays returned by the native
* library - confirm against the Tesseract C API.
*
* @param arr pointer reference to the text array to deallocate
*/
public static native void TessDeleteTextArray(PointerByReference arr);
/**
* Deallocates the memory block occupied by an integer array.
* <p>
* NOTE(review): presumably meant for int arrays returned by the native
* library - confirm against the Tesseract C API.
*
* @param arr the int array to deallocate
*/
public static native void TessDeleteIntArray(IntBuffer arr);
/* Renderer API */
/**
* Native binding for <code>TessTextRendererCreate</code>.
* <p>
* NOTE(review): judging by the name, presumably creates a plain-text result
* renderer - confirm against the Tesseract C API.
*
* @param outputbase presumably the base name of the output file - TODO
* confirm
* @return the renderer handle returned by the native call
*/
public static native TessResultRenderer TessTextRendererCreate(String outputbase);
/**
* Native binding for <code>TessHOcrRendererCreate</code>.
* <p>
* NOTE(review): judging by the name, presumably creates an hOCR result
* renderer - confirm against the Tesseract C API.
*
* @param outputbase presumably the base name of the output file - TODO
* confirm
* @return the renderer handle returned by the native call
*/
public static native TessResultRenderer TessHOcrRendererCreate(String outputbase);
/**
* Native binding for <code>TessHOcrRendererCreate2</code>.
* <p>
* NOTE(review): judging by the name, presumably an hOCR renderer factory
* with an extra font-info option - confirm against the Tesseract C API.
*
* @param outputbase presumably the base name of the output file - TODO
* confirm
* @param font_info passed to the native call as an int; presumably a
* boolean-style flag (non-zero to enable) - TODO confirm
* @return the renderer handle returned by the native call
*/
public static native TessResultRenderer TessHOcrRendererCreate2(String outputbase, int font_info);
/**
* Native binding for <code>TessPDFRendererCreate</code>.
* <p>
* NOTE(review): judging by the name, presumably creates a PDF result
* renderer - confirm against the Tesseract C API.
*
* @param outputbase presumably the base name of the output file - TODO
* confirm
* @param datadir presumably the Tesseract data directory - TODO confirm
* @return the renderer handle returned by the native call
*/
public static native TessResultRenderer TessPDFRendererCreate(String outputbase, String datadir);
/**
* Native binding for <code>TessPDFRendererCreateTextonly</code>.
* <p>
* NOTE(review): judging by the name, presumably a PDF renderer factory with
* a text-only option - confirm against the Tesseract C API.
*
* @param outputbase presumably the base name of the output file - TODO
* confirm
* @param datadir presumably the Tesseract data directory - TODO confirm
* @param textonly passed to the native call as an int; presumably a
* boolean-style flag (non-zero for text-only output) - TODO confirm
* @return the renderer handle returned by the native call
*/
public static native TessResultRenderer TessPDFRendererCreateTextonly(String outputbase, String datadir, int textonly);
/**
* Native binding for <code>TessUnlvRendererCreate</code>.
* <p>
* NOTE(review): judging by the name, presumably creates a UNLV-format
* result renderer - confirm against the Tesseract C API.
*
* @param outputbase presumably the base name of the output file - TODO
* confirm
* @return the renderer handle returned by the native call
*/
public static native TessResultRenderer TessUnlvRendererCreate(String outputbase);
/**
* Native binding for <code>TessBoxTextRendererCreate</code>.
* <p>
* NOTE(review): judging by the name, presumably creates a box-text result
* renderer - confirm against the Tesseract C API.
*
* @param outputbase presumably the base name of the output file - TODO
* confirm
* @return the renderer handle returned by the native call
*/
public static native TessResultRenderer TessBoxTextRendererCreate(String outputbase);
/**
* Native binding for <code>TessDeleteResultRenderer</code>.
* <p>
* NOTE(review): judging by the name, presumably disposes the given renderer
* - confirm against the Tesseract C API, including whether renderers
* linked to it are released as well.
*
* @param renderer the renderer handle passed to the native call
*/
public static native void TessDeleteResultRenderer(TessResultRenderer renderer);
/**
* Native binding for <code>TessResultRendererInsert</code>.
* <p>
* NOTE(review): judging by the name and parameters, presumably links
* <code>next</code> into the renderer chain of <code>renderer</code> -
* confirm against the Tesseract C API.
*
* @param renderer the renderer handle passed to the native call
* @param next the renderer handle to insert
*/
public static native void TessResultRendererInsert(TessResultRenderer renderer, TessResultRenderer next);
/**
* Native binding for <code>TessResultRendererNext</code>.
* <p>
* NOTE(review): judging by the name, presumably returns the renderer that
* follows <code>renderer</code> in its chain - confirm against the
* Tesseract C API.
*
* @param renderer the renderer handle passed to the native call
* @return the renderer handle returned by the native call
*/
public static native TessResultRenderer TessResultRendererNext(TessResultRenderer renderer);
/**
* Native binding for <code>TessResultRendererBeginDocument</code>.
* <p>
* NOTE(review): judging by the name, presumably starts a new output
* document - confirm against the Tesseract C API.
*
* @param renderer the renderer handle passed to the native call
* @param title presumably the document title - TODO confirm
* @return the native int result; presumably non-zero on success - TODO
* confirm
*/
public static native int TessResultRendererBeginDocument(TessResultRenderer renderer, String title);
/**
* Native binding for <code>TessResultRendererAddImage</code>.
* <p>
* NOTE(review): judging by the name, presumably adds the current
* recognition result/image to the open document - confirm against the
* Tesseract C API.
*
* @param renderer the renderer handle passed to the native call
* @param api pointer reference passed to the native call; presumably refers
* to the Tesseract base API instance - TODO confirm
* @return the native int result; presumably non-zero on success - TODO
* confirm
*/
public static native int TessResultRendererAddImage(TessResultRenderer renderer, PointerByReference api);
/**
* Native binding for <code>TessResultRendererEndDocument</code>.
* <p>
* NOTE(review): judging by the name, presumably finishes the open output
* document - confirm against the Tesseract C API.
*
* @param renderer the renderer handle passed to the native call
* @return the native int result; presumably non-zero on success - TODO
* confirm
*/
public static native int TessResultRendererEndDocument(TessResultRenderer renderer);
/**
* Native binding for <code>TessResultRendererExtention</code>.
* <p>
* The result is returned as a raw {@link Pointer}, not a
* <code>String</code>, so the caller has to read the value from the
* pointer itself.
* <p>
* NOTE(review): presumably yields the renderer's output file extension. The
* spelling "Extention" presumably has to match the exported native symbol -
* confirm before renaming.
*
* @param renderer the renderer handle passed to the native call
* @return the pointer returned by the native call
*/
public static native Pointer TessResultRendererExtention(TessResultRenderer renderer);
/**
* Native binding for <code>TessResultRendererTitle</code>.
* <p>
* The result is returned as a raw {@link Pointer}, not a
* <code>String</code>, so the caller has to read the value from the
* pointer itself.
* <p>
* NOTE(review): presumably yields the title of the renderer's document -
* confirm against the Tesseract C API.
*
* @param renderer the renderer handle passed to the native call
* @return the pointer returned by the native call
*/
public static native Pointer TessResultRendererTitle(TessResultRenderer renderer);
/**
* Native binding for <code>TessResultRendererImageNum</code>.
* <p>
* NOTE(review): judging by the name, presumably reports the index or count
* of images handled by the renderer - confirm against the Tesseract C API.
*
* @param renderer the renderer handle passed to the native call
* @return the int returned by the native call
*/
public static native int TessResultRendererImageNum(TessResultRenderer renderer);
/**
* Creates an instance of the base class for all Tesseract APIs.
* <p>
* NOTE(review): the returned handle is presumably meant to be released with
* <code>TessBaseAPIDelete</code> - confirm.
*
* @return the TesseractAPI instance
*/
public static native TessBaseAPI TessBaseAPICreate();
/**
* Disposes the TesseractAPI instance.
* <p>
* NOTE(review): the handle presumably must not be used after this call -
* confirm.
*
* @param handle the TesseractAPI instance to dispose
*/
public static native void TessBaseAPIDelete(TessBaseAPI handle);
/**
* Sets the name of the input file. Needed only for training and reading a
* UNLV zone file, and for searchable PDF output.
*
* @param handle the TesseractAPI instance
* @param name name of the input file
*/
public static native void TessBaseAPISetInputName(TessBaseAPI handle, String name);
/**
* Gets the name of the input file.
* <p>
* This function and the related input-image/resolution getters are required
* for searchable PDF output. We need our hands on the input file so that we
* can include it in the PDF without transcoding. If that is not possible,
* we need the original image. Finally, resolution metadata is stored in the
* PDF so we need that as well.
*
* @param handle the TesseractAPI instance
* @return input file name
*/
public static native String TessBaseAPIGetInputName(TessBaseAPI handle);
/**
* Native binding for <code>TessBaseAPISetInputImage</code>.
* <p>
* NOTE(review): judging by the name, presumably stores the original input
* image on the API instance - confirm against the Tesseract C API.
*
* @param handle the TesseractAPI instance
* @param pix the Leptonica <code>Pix</code> image passed to the native call
*/
public static native void TessBaseAPISetInputImage(TessBaseAPI handle, Pix pix);
/**
* Native binding for <code>TessBaseAPIGetInputImage</code>.
* <p>
* NOTE(review): judging by the name, presumably returns the input image
* held by the API instance - confirm against the Tesseract C API.
*
* @param handle the TesseractAPI instance
* @return the <code>Pix</code> returned by the native call
*/
public static native Pix TessBaseAPIGetInputImage(TessBaseAPI handle);
/**
* Native binding for <code>TessBaseAPIGetSourceYResolution</code>.
* <p>
* NOTE(review): judging by the name, presumably returns the vertical
* resolution of the source image; units are not visible here - confirm
* against the Tesseract C API.
*
* @param handle the TesseractAPI instance
* @return the int returned by the native call
*/
public static native int TessBaseAPIGetSourceYResolution(TessBaseAPI handle);
/**
* Native binding for <code>TessBaseAPIGetDatapath</code>.
* <p>
* NOTE(review): judging by the name, presumably returns the data path the
* API instance is using - confirm against the Tesseract C API.
*
* @param handle the TesseractAPI instance
* @return the string returned by the native call
*/
public static native String TessBaseAPIGetDatapath(TessBaseAPI handle);
/**
* Sets the name of the bonus output files. Needed only for debugging.
*
* @param handle the TesseractAPI instance
* @param name name of the output file
*/
public static native void TessBaseAPISetOutputName(TessBaseAPI handle, String name);
/**
* Sets the value of an internal "parameter." Supply the name of the
* parameter and the value as a string, just as you would in a config file.
* Returns false if the name lookup failed. E.g.,
* <code>SetVariable("tessedit_char_blacklist", "xyz");</code> to ignore x,
* y and z. Or <code>SetVariable("classify_bln_numeric_mode", "1");</code>
* to set numeric-only mode. <code>SetVariable</code> may be used before
* <code>Init</code>, but settings will revert to defaults on
* <code>End()</code>.<br>
* <br>
* Note: Must be called after <code>Init()</code>. Only works for non-init
* variables (init variables should be passed to <code>Init()</code>).
* <p>
* NOTE(review): the "may be used before Init" and "must be called after
* Init()" statements above appear to conflict - confirm the required call
* order against the Tesseract API documentation.
*
* @param handle the TesseractAPI instance
* @param name name of the parameter to set
* @param value the parameter value, as a string
* @return 1 on success; presumably 0 if the name lookup failed - TODO
* confirm
*/
public static native int TessBaseAPISetVariable(TessBaseAPI handle, String name, String value);
/**
* Gets the value of an internal int parameter.
*
* @param handle the TesseractAPI instance
* @param name name of the parameter to look up
* @param value int buffer passed to the native call; presumably receives
* the parameter value - TODO confirm
* @return 1 on success
*/
public static native int TessBaseAPIGetIntVariable(TessBaseAPI handle, String name, IntBuffer value);
/**
* Gets the value of an internal bool parameter.
* <p>
* The value is exchanged through an {@link IntBuffer}; there is no boolean
* type in this signature.
*
* @param handle the TesseractAPI instance
* @param name name of the parameter to look up
* @param value int buffer passed to the native call; presumably receives
* the bool value as an int - TODO confirm
* @return 1 on success
*/
public static native int TessBaseAPIGetBoolVariable(TessBaseAPI handle, String name, IntBuffer value);
/**
* Gets the value of an internal double parameter.
*
* @param handle the TesseractAPI instance
* @param name name of the parameter to look up
* @param value double buffer passed to the native call; presumably receives
* the parameter value - TODO confirm
* @return 1 on success
*/
public static native int TessBaseAPIGetDoubleVariable(TessBaseAPI handle, String name, DoubleBuffer value);
/**
* Gets the value of an internal string parameter.
* <p>
* NOTE(review): the result for an unknown parameter name is not visible
* here (possibly <code>null</code>) - confirm against the Tesseract C API.
*
* @param handle the TesseractAPI instance
* @param name name of the parameter to look up
* @return the string value
*/
public static native String TessBaseAPIGetStringVariable(TessBaseAPI handle, String name);
/**
* Print Tesseract par
没有合适的资源?快使用搜索试试~ 我知道了~
java实现提取图片文字信息并生成表格
共158个文件
png:50个
class:45个
jar:28个
1星 需积分: 43 158 下载量 14 浏览量
2018-06-24
11:16:19
上传
评论 10
收藏 62.5MB ZIP 举报
温馨提示
对图片进行水印处理,利用TESS4J识别图片并提取信息生成excel表格。里面有字库文件所以占用空间较大。 说明:https://blog.csdn.net/xlantian/article/details/80789115
资源推荐
资源详情
资源评论
收起资源包目录
java实现提取图片文字信息并生成表格 (158个子文件)
api_config 27B
Tesseract.class 19KB
Tesseract1.class 18KB
ImageIOHelper.class 18KB
TessAPI1.class 12KB
TessAPI.class 12KB
PdfGsUtilities.class 8KB
LoadLibs.class 8KB
PdfBoxUtilities.class 7KB
ImageHelper.class 6KB
RP.class 5KB
ImageDeskew.class 4KB
ImageUtil.class 3KB
PdfUtilities.class 3KB
ITesseract.class 2KB
Utils.class 2KB
ITessAPI.class 2KB
LoggerConfig.class 2KB
WaterMark.class 1KB
ITesseract$RenderedFormat.class 1KB
Word.class 1KB
ITessAPI$ETEXT_DESC.class 1KB
PdfBoxUtilities$2.class 1004B
PdfGsUtilities$2.class 1000B
ITessAPI$EANYCODE_CHAR.class 892B
PdfBoxUtilities$1.class 854B
PdfGsUtilities$1.class 850B
ITessAPI$TessPolyBlockType.class 841B
LoggHelper.class 792B
ITessAPI$TessPageSegMode.class 785B
TesseractException.class 760B
ITessAPI$TimeVal.class 737B
ImageDeskew$HoughLine.class 676B
ITessAPI$TessMutableIterator.class 583B
ITessAPI$TessChoiceIterator.class 580B
ITessAPI$TessResultIterator.class 580B
ITessAPI$TessResultRenderer.class 580B
ITessAPI$TessPageIterator.class 574B
ITessAPI$TessBaseAPI.class 559B
ITessAPI$TessParagraphJustification.class 438B
ITessAPI$TessOrientation.class 421B
ITessAPI$TessPageIteratorLevel.class 421B
ITessAPI$TessWritingDirection.class 417B
ITessAPI$TessOcrEngineMode.class 411B
ITessAPI$TessTextlineOrder.class 402B
ITessAPI$CANCEL_FUNC.class 287B
.classpath 2KB
digits 38B
libtesseract3051.dll 2.73MB
hocr 22B
lept4j-1.6.4.jar 6.71MB
poi-ooxml-schemas-3.17.jar 5.65MB
xmlbeans-2.6.0.jar 2.6MB
poi-3.17.jar 2.58MB
pdfbox-2.0.9.jar 2.4MB
fontbox-2.0.9.jar 1.48MB
poi-ooxml-3.17.jar 1.41MB
itext-2.1.7.jar 1.08MB
jna-4.1.0.jar 893KB
commons-collections4-4.1.jar 734KB
jai-imageio-core-1.4.0.jar 613KB
xmlgraphics-commons-1.5.jar 588KB
log4j-1.2.17.jar 478KB
logback-core-1.2.3.jar 461KB
junit-4.12.jar 309KB
logback-classic-1.2.3.jar 284KB
commons-beanutils-1.9.2.jar 228KB
commons-io-2.6.jar 210KB
ghost4j-1.0.1.jar 176KB
jbig2-imageio-3.0.0.jar 149KB
jboss-vfs-3.2.12.Final.jar 141KB
pdfbox-tools-2.0.9.jar 71KB
commons-logging-1.2.jar 60KB
hamcrest-core-1.3.jar 44KB
slf4j-api-1.7.25.jar 40KB
log4j-over-slf4j-1.7.25.jar 23KB
jcl-over-slf4j-1.7.25.jar 16KB
jul-to-slf4j-1.7.25.jar 4KB
TessAPI1.java 55KB
TessAPI.java 52KB
ImageIOHelper.java 24KB
Tesseract.java 23KB
Tesseract1.java 22KB
ITessAPI.java 21KB
PdfGsUtilities.java 11KB
LoadLibs.java 9KB
ITesseract.java 8KB
ImageHelper.java 8KB
PdfBoxUtilities.java 7KB
PdfUtilities.java 5KB
ImageDeskew.java 5KB
ImageUtil.java 4KB
WaterMark.java 4KB
RP.java 3KB
Utils.java 2KB
Word.java 2KB
LoggerConfig.java 1KB
TesseractException.java 1KB
LoggHelper.java 1014B
50.png 1.42MB
共 158 条
- 1
- 2
资源评论
- 林宝yyds2022-09-26运行会报错 不是idea的项目 不建议下载 #运行出错
xlantian
- 粉丝: 46
- 资源: 2
上传资源 快速赚钱
- 我的内容管理 展开
- 我的资源 快来上传第一个资源
- 我的收益 登录查看自己的收益
- 我的积分 登录查看自己的积分
- 我的C币 登录后查看C币余额
- 我的收藏
- 我的下载
- 下载帮助
安全验证
文档复制为VIP权益,开通VIP直接复制
信息提交成功