原创

使用百度api进行身份证照片文字识别

首先需要登陆百度ai平台进行注册 http://ai.baidu.com 进入控制台创建应用,如下图:
file
创建完毕后就有AppID API Key Secret Key,通过这三个标识我们就能获取到所谓的鉴权token了。
下面开始正题
导入依赖

<dependency>
            <groupId>com.google.code.gson</groupId>
            <artifactId>gson</artifactId>
            <version>2.8.2</version>
        </dependency>

        <dependency>
            <groupId>com.baidu.aip</groupId>
            <artifactId>java-sdk</artifactId>
            <version>4.1.0</version>
        </dependency>

需要工具类,下载的链接分别是


    /**
     * 重要提示代码中所需工具类
     * FileUtil,Base64Util,HttpUtil,GsonUtils请从
     * https://ai.baidu.com/file/658A35ABAB2D404FBF903F64D47C1F72
     * https://ai.baidu.com/file/C8D81F3301E24D2892968F09AE1AD6E2
     * https://ai.baidu.com/file/544D677F5D4E4F17B4122FBD60DB82B3
     * https://ai.baidu.com/file/470B3ACCA3FE43788B5A963BF0B625F3
     * 下载
     */

获取token的代码和识别的例子如下,接口调用次数在控制台我们可以看到,如下:
file

Test003.java

import com.baidu.aip.ocr.AipOcr;
import com.baidu.aip.util.Base64Util;
import org.json.JSONObject;

import java.io.BufferedReader;
import java.io.InputStreamReader;
import java.net.HttpURLConnection;
import java.net.URL;
import java.net.URLEncoder;
import java.util.HashMap;
import java.util.List;
import java.util.Map;

/**
 * @Author: haohaowang
 * @Desc
 * @Date: 2019/5/9 17:21
 */
public class Test003 {



    //设置APPID/AK/SK
    public static final String APP_ID = "xxx";
    public static final String API_KEY = "xxx";
    public static final String SECRET_KEY = "xxxx";

    /**
     * 重要提示代码中所需工具类
     * FileUtil,Base64Util,HttpUtil,GsonUtils请从
     * https://ai.baidu.com/file/658A35ABAB2D404FBF903F64D47C1F72
     * https://ai.baidu.com/file/C8D81F3301E24D2892968F09AE1AD6E2
     * https://ai.baidu.com/file/544D677F5D4E4F17B4122FBD60DB82B3
     * https://ai.baidu.com/file/470B3ACCA3FE43788B5A963BF0B625F3
     * 下载
     */
    public static void main(String[] args) {
        // 身份证识别url
        String idcardIdentificate = "https://aip.baidubce.com/rest/2.0/ocr/v1/idcard";
        // 本地图片路径
        String filePath = "D:\\cd.jpg";
        try {
            byte[] imgData = FileUtil.readFileByBytes(filePath);
            String imgStr = Base64Util.encode(imgData);
            // 识别身份证正面id_card_side=front;识别身份证背面id_card_side=back;
            String params = "id_card_side=front&" + URLEncoder.encode("image", "UTF-8") + "="
                    + URLEncoder.encode(imgStr, "UTF-8");
            /**
             * 线上环境access_token有过期时间, 客户端可自行缓存,过期后重新获取。
             */
            String accessToken = getAuth();
            String result = HttpUtil.post(idcardIdentificate, accessToken, params);
            System.out.println(result);
        } catch (Exception e) {
            e.printStackTrace();
        }
    }

    public static String getAuth() {
        // 官网获取的 API Key 更新为你注册的
        String clientId = API_KEY;
        // 官网获取的 Secret Key 更新为你注册的
        String clientSecret = SECRET_KEY;
        return getAuth(clientId, clientSecret);
    }

    /**
     * 获取API访问token
     * 该token有一定的有效期,需要自行管理,当失效时需重新获取.
     * @param ak - 百度云官网获取的 API Key
     * @param sk - 百度云官网获取的 Securet Key
     * @return assess_token 示例:
     * "24.460da4889caad24cccdb1fea17221975.2592000.1491995545.282335-1234567"
     */
    public static String getAuth(String ak, String sk) {
        // 获取token地址
        String authHost = "https://aip.baidubce.com/oauth/2.0/token?";
        String getAccessTokenUrl = authHost
                // 1. grant_type为固定参数
                + "grant_type=client_credentials"
                // 2. 官网获取的 API Key
                + "&client_id=" + ak
                // 3. 官网获取的 Secret Key
                + "&client_secret=" + sk;
        try {
            URL realUrl = new URL(getAccessTokenUrl);
            // 打开和URL之间的连接
            HttpURLConnection connection = (HttpURLConnection) realUrl.openConnection();
            connection.setRequestMethod("GET");
            connection.connect();
            // 获取所有响应头字段
            Map<String, List<String>> map = connection.getHeaderFields();
            // 遍历所有的响应头字段
            for (String key : map.keySet()) {
                System.err.println(key + "--->" + map.get(key));
            }
            // 定义 BufferedReader输入流来读取URL的响应
            BufferedReader in = new BufferedReader(new InputStreamReader(connection.getInputStream()));
            String result = "";
            String line;
            while ((line = in.readLine()) != null) {
                result += line;
            }
            /**
             * 返回结果示例
             */
            System.err.println("result:" + result);
            JSONObject jsonObject = new JSONObject(result);
            String access_token = jsonObject.getString("access_token");
            return access_token;
        } catch (Exception e) {
            System.err.printf("获取token失败!");
            e.printStackTrace(System.err);
        }
        return null;
    }

}

识别的结果(部分内容隐藏):


{
  "log_id": 2372062689588418057,
  "words_result_num": 6,
  "direction": 1,
  "image_status": "normal",
  "words_result": {
    "住址": {
      "location": {
        "width": 364,
        "top": 2342,
        "height": 1072,
        "left": 1449
      },
      "words": "xxxxxxxxxxxx"
    },
    "出生": {
      "location": {
        "width": 90,
        "top": 2547,
        "height": 838,
        "left": 1230
      },
      "words": "xxxxxxx"
    },
    "姓名": {
      "location": {
        "width": 118,
        "top": 3053,
        "height": 336,
        "left": 801
      },
      "words": "xxxxxx"
    },
    "公民身份号码": {
      "location": {
        "width": 96,
        "top": 1539,
        "height": 1441,
        "left": 1986
      },
      "words": "xxxxxxxxxxxxxxx"
    },
    "性别": {
      "location": {
        "width": 84,
        "top": 3311,
        "height": 74,
        "left": 1037
      },
      "words": "男"
    },
    "民族": {
      "location": {
        "width": 80,
        "top": 2799,
        "height": 70,
        "left": 1031
      },
      "words": "汉"
    }
  }
}
正文到此结束(点击广告是对作者最大的支持)