爬虫中遇到登录验证码,java 如何识别图片验证码
https://blog.csdn.net/persistencegoing/article/details/84376427import java.awt.image.BufferedImage;import java.io.File;import java.io.FileOutputStream;import java.io.IOException;import java.io.I...
https://blog.csdn.net/persistencegoing/article/details/84376427
import java.awt.image.BufferedImage;
import java.io.File;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.util.Date;
import javax.imageio.ImageIO;
import org.apache.commons.httpclient.HttpClient;
import org.apache.commons.httpclient.HttpStatus;
import org.apache.commons.httpclient.methods.GetMethod;
import org.apache.commons.io.IOUtils;
import com.asprise.ocr.Ocr;
import com.asprise.util.ocr.OCR;
public class ReadImg {
public static void main(String[] args) throws IOException {
HttpClient httpClient = new HttpClient();
GetMethod getMethod = new GetMethod(“http://dz.bjjtgl.gov.cn/service/checkCode.do”);
// GetMethod getMethod = new GetMethod(“https://dynamic.12306.cn/otsweb/passCodeAction.do?rand=sjrand”);
int statusCode = httpClient.executeMethod(getMethod);
if (statusCode != HttpStatus.SC_OK) {
System.err.println("Method failed: " + getMethod.getStatusLine());
return ;
}
String picName = “F:\img\”;
File filepic=new File(picName);
if(!filepic.exists())
filepic.mkdir();
File filepicF=new File(picName+new Date().getTime() + “.jpg”);
InputStream inputStream = getMethod.getResponseBodyAsStream();
OutputStream outStream = new FileOutputStream(filepicF);
IOUtils.copy(inputStream, outStream);
outStream.close();
Ocr.setUp(); // one time setup
Ocr ocr = new Ocr(); // create a new OCR engine
ocr.startEngine("eng", Ocr.SPEED_FASTEST); // English
String s = ocr.recognize(new File[] {filepicF},Ocr.RECOGNIZE_TYPE_TEXT, Ocr.OUTPUT_FORMAT_PLAINTEXT);
System.out.println("Result: " + s);
System.out.println("图片文字为:" + s.replace(",", "").replace("i", "1").replace(" ", "").replace("'", "").replace("o", "0").replace("O", "0").replace("g", "6").replace("B", "8").replace("s", "5").replace("z", "2"));
// ocr more images here ...
ocr.stopEngine();
}
}
注意:主要的jar包
1.aocr.jar – 去Asprise官网下载最新jar包 http://asprise.com/royalty-free-library/java-ocr-for-windows-mac-linux-download.html
2.commons-codec.jar
3.commons-httpclient-3.1.jar
4.commons-io.jar
5.commons-logging-1.0.4.jar
希望大家关注我一波,防止以后迷路,有需要的可以加群讨论互相学习java ,学习路线探讨,经验分享与java求职
群号:721 515 304
魔乐社区(Modelers.cn) 是一个中立、公益的人工智能社区,提供人工智能工具、模型、数据的托管、展示与应用协同服务,为人工智能开发及爱好者搭建开放的学习交流平台。社区通过理事会方式运作,由全产业链共同建设、共同运营、共同享有,推动国产AI生态繁荣发展。
更多推荐


所有评论(0)