我想从位图中提取一个数字。我正在使用tess-two
库,但它无法正确识别。
示例代码:
@Override
public void onClick(View v) {
switch (v.getId()){
case R.id.b2:
InputStream is = null;
try {
is = getApplicationContext().getAssets().open("zak.jpeg");
} catch (IOException e1) {
e1.printStackTrace();
}
final Drawable drw = Drawable.createFromStream(is, null);
bmp = ((BitmapDrawable) drw).getBitmap();
TessBaseAPI baseApi = new TessBaseAPI();
bmp =BITMAP_RESIZER(bmp,bmp.getWidth(),bmp.getHeight());
bmp =convertToGrayscale(bmp);
bmp =RemoveNoise(bmp);
iv.setImageBitmap(bmp);
baseApi.init("/mnt/sdcard/Download/", "eng");
baseApi.setVariable(TessBaseAPI.VAR_CHAR_WHITELIST,"1234567890");
baseApi.setVariable(TessBaseAPI.VAR_CHAR_BLACKLIST,"!@#$%^&* ()_+=-[]}{" +";:'\"\\|~`,./<>?");
baseApi.setDebug(true);
baseApi.setImage(bmp);
String recognizedText = baseApi.getUTF8Text();
tv.setText(" numbers : "+recognizedText.trim());
Log.d("karim", recognizedText);
baseApi.end();
break;
将位图转换为灰度的方法:
public static Bitmap convertToGrayscale(Bitmap bmpOriginal) {
int width, height;
height = bmpOriginal.getHeight();
width = bmpOriginal.getWidth();
Bitmap bmpGrayscale = Bitmap.createBitmap(width, height, Bitmap.Config.ARGB_8888);
Canvas c = new Canvas(bmpGrayscale);
Paint paint = new Paint();
ColorMatrix cm = new ColorMatrix();
cm.setSaturation(0);
ColorMatrixColorFilter f = new ColorMatrixColorFilter(cm);
paint.setColorFilter(f);
c.drawBitmap(bmpOriginal, 0, 0, paint);
return bmpGrayscale;
}
从位图中删除噪音的方法:
public Bitmap RemoveNoise(Bitmap bmap) {
for (int x = 0; x < bmap.getWidth(); x++) {
for (int y = 0; y < bmap.getHeight(); y++) {
int pixel = bmap.getPixel(x, y);
int R = Color.red(pixel);
int G = Color.green(pixel);
int B = Color.blue(pixel);
if (R < 162 && G < 162 && B < 162)
bmap.setPixel(x, y, Color.BLACK);
}
}
for (int x = 0; x < bmap.getWidth(); x++) {
for (int y = 0; y < bmap.getHeight(); y++) {
int pixel = bmap.getPixel(x, y);
int R = Color.red(pixel);
int G = Color.green(pixel);
int B = Color.blue(pixel);
if (R > 162 && G > 162 && B > 162)
bmap.setPixel(x, y, Color.WHITE);
}
}
return bmap;
}
调整位图大小的方法:
public Bitmap BITMAP_RESIZER(Bitmap bitmap,int newWidth,int newHeight)
{
Bitmap scaledBitmap = Bitmap.createBitmap(newWidth, newHeight, Config.ARGB_8888);
float ratioX = newWidth / (float) bitmap.getWidth();
float ratioY = newHeight / (float) bitmap.getHeight();
float middleX = newWidth / 2.0f;
float middleY = newHeight / 2.0f;
Matrix scaleMatrix = new Matrix();
scaleMatrix.setScale(ratioX, ratioY, middleX, middleY);
Canvas canvas = new Canvas(scaledBitmap);
canvas.setMatrix(scaleMatrix);
canvas.drawBitmap(bitmap, middleX - bitmap.getWidth() / 2, middleY - bitmap.getHeight() / 2, new Paint(Paint.FILTER_BITMAP_FLAG));
return scaledBitmap;
}
如何解决此问题?
答案 0 :(得分:1)
也许这有些晚了但是如果我理解正确你想要的只是数字作为输出。
您提供的白名单是可以的,但tesseract会强制将字母与白名单中指定的数字相匹配。没有办法让它省略某些字符,但你可以做的是为整个字母设置白名单,然后手动将字母与代码中的数字分开。
答案 1 :(得分:0)
baseApi.SetVariable(&#34; tessedit_char_whitelist&#34;,&#34; 0123456789&#34;);