我正在尝试从扫描的文档中提取文本,但是遇到了“OCR运行时错误”。为了支持大型文档,我还在 web.config 中做了如下更改……如果您有任何解决方案,请帮助我……谢谢大家。
<!-- Raises the ASP.NET request limits so that large scanned documents can be uploaded.
     Per the ASP.NET httpRuntime documentation, maxRequestLength and
     requestLengthDiskThreshold are expressed in kilobytes and executionTimeout in seconds.
     NOTE(review): these settings only affect upload size/timeout; they do not influence
     the OCR call itself. -->
<httpRuntime targetFramework="4.5.2" maxRequestLength="200000"
executionTimeout="999999" requestLengthDiskThreshold="200000"/>
以下是我的代码隐藏(code-behind)文件中的代码:
/// <summary>
/// Saves the uploaded scan under ~/Uploads, runs OCR on it, shows the recognised text in
/// <c>Label1</c> and submits the fields found on fixed line positions through
/// <c>blObj.SubmitBAL</c>.
/// </summary>
/// <param name="sender">The control that raised the click event.</param>
/// <param name="e">Event data (unused).</param>
protected void Button1_Click(object sender, EventArgs e)
{
    // Zero-based positions of the fields inside the OCR output.
    const int firstNameLine = 2;
    const int fatherNameLine = 3;
    const int dateOfBirthLine = 4;
    const int accountNumberLine = 6;

    // A postback without a selected file would otherwise dereference a null PostedFile.
    if (!FileUpload1.HasFile)
    {
        Label1.Text = "Please select a scanned document to upload.";
        return;
    }

    // Path.GetFileName strips any client-side directory part from the posted name.
    string filePath = Server.MapPath("~/Uploads/" + Path.GetFileName(FileUpload1.PostedFile.FileName));
    FileUpload1.SaveAs(filePath);

    string extractText = this.ExtractTextFromImage(filePath) ?? string.Empty;
    string[] lines = extractText.Split(
        new[] { "\r\n", "\r", "\n" },
        StringSplitOptions.None);

    // The OCR text originates from an uploaded file, so encode it before emitting it as
    // markup, and turn every newline flavour handled by the split above into a line break.
    Label1.Text = Server.HtmlEncode(extractText)
        .Replace("\r\n", "\n")
        .Replace("\r", "\n")
        .Replace("\n", "<br />");

    // Without enough lines the fixed indexes below would throw IndexOutOfRangeException.
    if (lines.Length <= accountNumberLine)
    {
        Label1.Text += "<br />The document does not contain the expected fields.";
        return;
    }

    string firstName = lines[firstNameLine];
    string fatherName = lines[fatherNameLine];
    string dob = lines[dateOfBirthLine];
    string permanentAccountNumber = lines[accountNumberLine];

    // Overwrite the third character with "/" (presumably to repair a misread date
    // separator - TODO confirm). Shorter strings are passed through unchanged instead of
    // throwing ArgumentOutOfRangeException.
    string dateOfBirth = dob.Length > 2
        ? dob.Substring(0, 2) + "/" + dob.Substring(3)
        : dob;

    boObj.FirstName = firstName;
    boObj.MiddleName = fatherName;
    boObj.DateOfBirth = dateOfBirth;
    boObj.AccountNumber = permanentAccountNumber;
    blObj.SubmitBAL(boObj);
}
/// <summary>
/// Runs MODI OCR (English) on the image file and returns the text of its first page.
/// </summary>
/// <param name="filePath">Path of the image file to recognise.</param>
/// <returns>The recognised text of the first page, or an empty string when the document has no pages.</returns>
/// <remarks>
/// Exceptions thrown by MODI (for example the "OCR running error" raised by
/// <c>OCR</c>) still propagate to the caller; this method only guarantees that the
/// document is closed and the COM objects are released in every case.
/// </remarks>
private string ExtractTextFromImage(string filePath)
{
    Document modiDocument1 = new Document();
    MODI.Image modiImage = null;
    bool documentOpened = false;
    try
    {
        modiDocument1.Create(filePath);
        documentOpened = true;

        modiDocument1.OCR(MiLANGUAGES.miLANG_ENGLISH); // reported failure point

        // Guard against a document without pages before indexing into Images.
        if (modiDocument1.Images.Count == 0)
        {
            return string.Empty;
        }

        // Direct cast: an unexpected type fails here instead of as a later null dereference.
        modiImage = (MODI.Image)modiDocument1.Images[0];
        return modiImage.Layout.Text;
    }
    finally
    {
        // Only close a document that was actually opened, so a failure in Create is not
        // masked by a second exception from Close.
        if (documentOpened)
        {
            modiDocument1.Close();
        }

        // Release the COM wrappers deterministically instead of waiting for the GC.
        if (modiImage != null)
        {
            System.Runtime.InteropServices.Marshal.ReleaseComObject(modiImage);
        }
        System.Runtime.InteropServices.Marshal.ReleaseComObject(modiDocument1);
    }
}