使用百度api进行身份证照片文字识别
首先需要登陆百度ai平台进行注册 http://ai.baidu.com 进入控制台创建应用,如下图:
创建完毕后就有AppID API Key Secret Key,通过这三个标识我们就能获取到所谓的鉴权token了。
下面开始正题
导入依赖
<dependency>
<groupId>com.google.code.gson</groupId>
<artifactId>gson</artifactId>
<version>2.8.2</version>
</dependency>
<dependency>
<groupId>com.baidu.aip</groupId>
<artifactId>java-sdk</artifactId>
<version>4.1.0</version>
</dependency>
需要工具类,下载的链接分别是
/**
* 重要提示代码中所需工具类
* FileUtil,Base64Util,HttpUtil,GsonUtils请从
* https://ai.baidu.com/file/658A35ABAB2D404FBF903F64D47C1F72
* https://ai.baidu.com/file/C8D81F3301E24D2892968F09AE1AD6E2
* https://ai.baidu.com/file/544D677F5D4E4F17B4122FBD60DB82B3
* https://ai.baidu.com/file/470B3ACCA3FE43788B5A963BF0B625F3
* 下载
*/
获取token的代码和识别的例子如下,接口调用次数在控制台我们可以看到,如下:
Test003.java
import com.baidu.aip.ocr.AipOcr;
import com.baidu.aip.util.Base64Util;
import org.json.JSONObject;
import java.io.BufferedReader;
import java.io.InputStreamReader;
import java.net.HttpURLConnection;
import java.net.URL;
import java.net.URLEncoder;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
/**
* @Author: haohaowang
* @Desc
* @Date: 2019/5/9 17:21
*/
public class Test003 {
//设置APPID/AK/SK
public static final String APP_ID = "xxx";
public static final String API_KEY = "xxx";
public static final String SECRET_KEY = "xxxx";
/**
* 重要提示代码中所需工具类
* FileUtil,Base64Util,HttpUtil,GsonUtils请从
* https://ai.baidu.com/file/658A35ABAB2D404FBF903F64D47C1F72
* https://ai.baidu.com/file/C8D81F3301E24D2892968F09AE1AD6E2
* https://ai.baidu.com/file/544D677F5D4E4F17B4122FBD60DB82B3
* https://ai.baidu.com/file/470B3ACCA3FE43788B5A963BF0B625F3
* 下载
*/
public static void main(String[] args) {
// 身份证识别url
String idcardIdentificate = "https://aip.baidubce.com/rest/2.0/ocr/v1/idcard";
// 本地图片路径
String filePath = "D:\\cd.jpg";
try {
byte[] imgData = FileUtil.readFileByBytes(filePath);
String imgStr = Base64Util.encode(imgData);
// 识别身份证正面id_card_side=front;识别身份证背面id_card_side=back;
String params = "id_card_side=front&" + URLEncoder.encode("image", "UTF-8") + "="
+ URLEncoder.encode(imgStr, "UTF-8");
/**
* 线上环境access_token有过期时间, 客户端可自行缓存,过期后重新获取。
*/
String accessToken = getAuth();
String result = HttpUtil.post(idcardIdentificate, accessToken, params);
System.out.println(result);
} catch (Exception e) {
e.printStackTrace();
}
}
public static String getAuth() {
// 官网获取的 API Key 更新为你注册的
String clientId = API_KEY;
// 官网获取的 Secret Key 更新为你注册的
String clientSecret = SECRET_KEY;
return getAuth(clientId, clientSecret);
}
/**
* 获取API访问token
* 该token有一定的有效期,需要自行管理,当失效时需重新获取.
* @param ak - 百度云官网获取的 API Key
* @param sk - 百度云官网获取的 Securet Key
* @return assess_token 示例:
* "24.460da4889caad24cccdb1fea17221975.2592000.1491995545.282335-1234567"
*/
public static String getAuth(String ak, String sk) {
// 获取token地址
String authHost = "https://aip.baidubce.com/oauth/2.0/token?";
String getAccessTokenUrl = authHost
// 1. grant_type为固定参数
+ "grant_type=client_credentials"
// 2. 官网获取的 API Key
+ "&client_id=" + ak
// 3. 官网获取的 Secret Key
+ "&client_secret=" + sk;
try {
URL realUrl = new URL(getAccessTokenUrl);
// 打开和URL之间的连接
HttpURLConnection connection = (HttpURLConnection) realUrl.openConnection();
connection.setRequestMethod("GET");
connection.connect();
// 获取所有响应头字段
Map<String, List<String>> map = connection.getHeaderFields();
// 遍历所有的响应头字段
for (String key : map.keySet()) {
System.err.println(key + "--->" + map.get(key));
}
// 定义 BufferedReader输入流来读取URL的响应
BufferedReader in = new BufferedReader(new InputStreamReader(connection.getInputStream()));
String result = "";
String line;
while ((line = in.readLine()) != null) {
result += line;
}
/**
* 返回结果示例
*/
System.err.println("result:" + result);
JSONObject jsonObject = new JSONObject(result);
String access_token = jsonObject.getString("access_token");
return access_token;
} catch (Exception e) {
System.err.printf("获取token失败!");
e.printStackTrace(System.err);
}
return null;
}
}
识别的结果(部分内容隐藏):
{
"log_id": 2372062689588418057,
"words_result_num": 6,
"direction": 1,
"image_status": "normal",
"words_result": {
"住址": {
"location": {
"width": 364,
"top": 2342,
"height": 1072,
"left": 1449
},
"words": "xxxxxxxxxxxx"
},
"出生": {
"location": {
"width": 90,
"top": 2547,
"height": 838,
"left": 1230
},
"words": "xxxxxxx"
},
"姓名": {
"location": {
"width": 118,
"top": 3053,
"height": 336,
"left": 801
},
"words": "xxxxxx"
},
"公民身份号码": {
"location": {
"width": 96,
"top": 1539,
"height": 1441,
"left": 1986
},
"words": "xxxxxxxxxxxxxxx"
},
"性别": {
"location": {
"width": 84,
"top": 3311,
"height": 74,
"left": 1037
},
"words": "男"
},
"民族": {
"location": {
"width": 80,
"top": 2799,
"height": 70,
"left": 1031
},
"words": "汉"
}
}
}
正文到此结束(点击广告是对作者最大的支持)