1.文档提取接口说明

文档提取接口（API）定义：支持图片/PDF 文档信息提取，可根据提示词智能提取文档内容，返回结构化结果。

1.1主要功能

文档提取接口能够识别并提取图片/PDF中的文档信息。其主要功能包括：

智能提取:: 支持根据提示词智能提取文档中的关键信息。
多格式支持:: 支持图片和PDF格式的文档提取。
多页处理:: 支持多页PDF文档的批量提取处理。
稳定高效:: 提供稳定的服务，响应及时，处理速度快。

1.2API接入

支持各种程序和设备接入，包括小程序、APP、采集设备等，灵活适用于不同应用场景。

2.请求信息

2.1请求地址(URL)

POST https://ocr-api.shiliuai.com/api/doc_extract/v1

2.2请求方式

POST

2.3请求头(header)

参数	类型	说明
Content-Type	string	application/json
Authorization	string	'APPCODE ' + 您的AppCode(注意英文空格)获取

参数	类型	说明
Content-Type	string	application/json
x-ca-key	string	您的AppKey获取
x-ca-timestamp	string	时间戳（毫秒）
x-ca-signature	string	签名sign

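签名认证（x-ca-key / x-ca-timestamp / x-ca-signature）的签名计算方式：
str = app_key + "&" + timestamp + "&" + app_secret   （三者用英文字符 & 依次拼接）
sign = md5(str)   （取32位小写十六进制字符串，timestamp 需与 x-ca-timestamp 请求头一致）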

2.4请求体(body)

参数	是否必填	类型	说明
file_base64	必填其中之一	string	base64编码的图片文件或PDF文件
file_url	必填其中之一	string	图片文件或PDF文件的url
prompt	选填	string	关于文档信息提取的提示词，比如："以json格式输出文档内容。"，默认以text形式输出

3.返回信息

3.1返回类型

JSON

3.2返回码

参数名	类型	说明
code	int	返回码，200表示成功
msg	string	返回信息

3.3返回信息

参数名	类型	说明
code	int	错误码
msg	string	错误信息（英文）
msg_cn	string	错误信息（中文）
success	bool	识别是否成功
file_id	string	请求文件ID
request_id	string	唯一请求ID
data	object	具体见返回示例

3.4返回示例

成功返回示例

成功示例：
{
    'code': 200,
    'msg': 'OK',
    'msg_cn': '成功',
    'success': True,
    'file_id': file id,
    'request_id': request id,
    'data': {
        "page_count": 5,        // int, 文件页面总数
        "process_pages": 5,     // int, 处理页面数
        "content": content      // 文档提取结果
    }
}

错误返回示例

失败示例：
{
    'code': error code,
    'msg': error message,
    'msg_cn': 中文错误信息,
    'success': False,
    'file_id': file id,
    'request_id': request id,
    'data': {}
}

3.5错误码

错误码	说明
200	成功
400	请求错误
401	未授权
500	服务错误

具体错误原因请看msg或msg_cn

4.示例代码

4.1 Python

同步调用

# -*- coding: utf-8 -*-
import requests
import base64
import json

# 请求接口
URL = "https://ocr-api.shiliuai.com/api/doc_extract/v1"

# 图片/pdf文件转base64
def get_base64(file_path):
    """Return the contents of ``file_path`` as a base64 text string.

    The file is opened in binary mode, so images and PDFs are handled alike.
    """
    with open(file_path, "rb") as fh:
        encoded = base64.b64encode(fh.read())
    return encoded.decode("utf8")

def demo(appcode, file_path, timeout=(10, 300)):
    """Send one document-extraction request using AppCode authentication.

    The decoded JSON reply is printed; nothing is returned.

    Args:
        appcode: AppCode credential, sent as ``Authorization: APPCODE <appcode>``.
        file_path: Path of the local image/PDF to upload (sent as base64).
        timeout: ``(connect, read)`` timeout in seconds passed to
            ``requests.post``. Without a timeout the call can block forever on
            a stalled connection. The default values are a guess, not a
            documented service limit; adjust for large PDFs.
    """
    # Request headers
    headers = {
        "Authorization": "APPCODE %s" % appcode,
        "Content-Type": "application/json"
    }

    # Request body; an empty prompt leaves the extraction prompt unset.
    b64 = get_base64(file_path)
    data = {
        "file_base64": b64,
        "prompt": ""
    }

    # Send the request and print the parsed JSON reply.
    response = requests.post(url=URL, headers=headers, json=data, timeout=timeout)
    content = json.loads(response.content)
    print(content)

if __name__ == "__main__":
    appcode = "你的APPCODE"
    file_path = "本地文件路径"
    demo(appcode, file_path)

# -*- coding: utf-8 -*-
import requests
import base64
import json
import hashlib
import time

# 请求接口
URL = "https://ocr-api.shiliuai.com/api/doc_extract/v1"

# 图片/pdf文件转base64
def get_base64(file_path):
    """Read ``file_path`` in binary mode and return its base64 encoding as ``str``."""
    with open(file_path, "rb") as source:
        raw = source.read()
    b64_bytes = base64.b64encode(raw)
    return b64_bytes.decode("utf8")

# md5
def md5(s):
    """Return the lowercase hexadecimal MD5 digest of ``s`` encoded as UTF-8."""
    hasher = hashlib.md5()
    hasher.update(s.encode("utf8"))
    return hasher.hexdigest()

def demo(app_key, app_secret, file_path, timeout=(10, 300)):
    """Send one document-extraction request using signature authentication.

    The signature is ``md5("<app_key>&<timestamp_ms>&<app_secret>")`` and is
    sent together with the key and the same timestamp in the ``x-ca-*``
    headers. The decoded JSON reply is printed; nothing is returned.

    Args:
        app_key: AppKey credential.
        app_secret: AppSecret credential; used only to compute the signature.
        file_path: Path of the local image/PDF to upload (sent as base64).
        timeout: ``(connect, read)`` timeout in seconds passed to
            ``requests.post``. Without a timeout the call can block forever on
            a stalled connection. The default values are a guess, not a
            documented service limit; adjust for large PDFs.
    """
    # Request headers (signature); timestamp is in milliseconds.
    t = int(time.time() * 1000)
    s = "%s&%s&%s" % (app_key, t, app_secret)
    sign = md5(s)
    headers = {
        "x-ca-key": app_key,
        "x-ca-timestamp": str(t),
        "x-ca-signature": sign,
        "Content-Type": "application/json"
    }

    # Request body; an empty prompt leaves the extraction prompt unset.
    b64 = get_base64(file_path)
    data = {
        "file_base64": b64,
        "prompt": ""
    }

    # Send the request and print the parsed JSON reply.
    response = requests.post(url=URL, headers=headers, json=data, timeout=timeout)
    content = json.loads(response.content)
    print(content)

if __name__ == "__main__":
    app_key = "你的APP_KEY"
    app_secret = "你的APP_SECRET"
    file_path = "本地文件路径"
    demo(app_key, app_secret, file_path)

4.2 PHP

//图片/pdf转base64
/**
 * Read a file and return its contents base64-encoded.
 *
 * Uses file_get_contents() instead of fopen()/fread(): fread() rejects a
 * length of 0, so the previous code failed on an empty file, and fopen()
 * raised a warning on a missing path before the else-branch could run.
 *
 * @param string $path Path of the image/PDF file.
 * @return string Base64 text, or "" (after printing a message) when the file
 *                cannot be read.
 */
function get_base64($path){
    if (!is_file($path) || !is_readable($path)) {
        printf("%s 文件不存在", $path);
        return "";
    }
    $binary = file_get_contents($path); // read the whole file
    if ($binary === false) {
        printf("%s 文件不存在", $path);
        return "";
    }
    return base64_encode($binary); // convert to base64
}

// Endpoint, credential and input file for the AppCode-authenticated request.
$url = "https://ocr-api.shiliuai.com/api/doc_extract/v1";
$appcode = "你的APPCODE";
$file_path = "文件路径";
$method = "POST";

// Request headers
$headers = array();
array_push($headers, "Authorization:APPCODE " . $appcode);
array_push($headers, "Content-Type:application/json");

// Request body; an empty prompt leaves the extraction prompt unset.
$b64 = get_base64($file_path);
$data = array(
    "file_base64" => $b64,
    "prompt" => ""
);
$post_data = json_encode($data);

// Send the request
$curl = curl_init();
curl_setopt($curl, CURLOPT_CUSTOMREQUEST, $method);
curl_setopt($curl, CURLOPT_URL, $url);
curl_setopt($curl, CURLOPT_HTTPHEADER, $headers);
curl_setopt($curl, CURLOPT_FAILONERROR, false);
curl_setopt($curl, CURLOPT_RETURNTRANSFER, true);
// Response headers are included in $result, so it is not pure JSON.
curl_setopt($curl, CURLOPT_HEADER, true);
// Keep certificate and host-name verification on: the request carries the
// AppCode and the document, which must not go to a spoofed endpoint.
curl_setopt($curl, CURLOPT_SSL_VERIFYPEER, true);
curl_setopt($curl, CURLOPT_SSL_VERIFYHOST, 2);
curl_setopt($curl, CURLOPT_POSTFIELDS, $post_data);

$result = curl_exec($curl);
if ($result === false) {
    // curl_exec() returns false on transport errors; show the reason.
    printf("curl error: %s\n", curl_error($curl));
}
var_dump($result);

/**
 * Return the base64 encoding of the file at $path.
 *
 * Reads with file_get_contents() so that an empty file yields "" instead of
 * failing in fread() (which rejects a zero length), and checks readability
 * first so a missing file does not raise an fopen() warning.
 *
 * @param string $path Path of the image/PDF file.
 * @return string Base64 text, or "" (after printing a message) when the file
 *                cannot be read.
 */
function get_base64($path){
    if (!is_file($path) || !is_readable($path)) {
        printf("%s 文件不存在", $path);
        return "";
    }
    $binary = file_get_contents($path); // read the whole file
    if ($binary === false) {
        printf("%s 文件不存在", $path);
        return "";
    }
    return base64_encode($binary); // convert to base64
}

// Endpoint and input file for the signature-authenticated request.
$url = "https://ocr-api.shiliuai.com/api/doc_extract/v1";
$file_path = "文件路径";
$method = "POST";

// Request headers (signature): sign = md5(app_key & timestamp & app_secret)
$app_key = "你的app_key";
$app_secret = "你的app_secret";
// Millisecond timestamp. Formatted with sprintf so the value is always plain
// digits, independent of PHP's float-to-string "precision" setting.
$timestamp = sprintf('%.0f', round(microtime(true) * 1000));
$sign_string = $app_key . "&" . $timestamp . "&" . $app_secret;
$sign = md5($sign_string);

$headers = array();
array_push($headers, "Content-Type:application/json");
array_push($headers, "x-ca-key:" . $app_key);
array_push($headers, "x-ca-timestamp:" . $timestamp);
array_push($headers, "x-ca-signature:" . $sign);

// Request body; an empty prompt leaves the extraction prompt unset.
$b64 = get_base64($file_path);
$data = array(
    "file_base64" => $b64,
    "prompt" => ""
);
$post_data = json_encode($data);

// Send the request
$curl = curl_init();
curl_setopt($curl, CURLOPT_CUSTOMREQUEST, $method);
curl_setopt($curl, CURLOPT_URL, $url);
curl_setopt($curl, CURLOPT_HTTPHEADER, $headers);
curl_setopt($curl, CURLOPT_FAILONERROR, false);
curl_setopt($curl, CURLOPT_RETURNTRANSFER, true);
// Response headers are included in $result, so it is not pure JSON.
curl_setopt($curl, CURLOPT_HEADER, true);
// Keep certificate and host-name verification on: the request carries the
// signed credentials and the document, which must not go to a spoofed endpoint.
curl_setopt($curl, CURLOPT_SSL_VERIFYPEER, true);
curl_setopt($curl, CURLOPT_SSL_VERIFYHOST, 2);
curl_setopt($curl, CURLOPT_POSTFIELDS, $post_data);

$result = curl_exec($curl);
if ($result === false) {
    // curl_exec() returns false on transport errors; show the reason.
    printf("curl error: %s\n", curl_error($curl));
}
var_dump($result);

4.3 Java

import com.alibaba.fastjson2.JSON;
import com.alibaba.fastjson2.JSONObject;
import org.apache.http.HttpResponse;
import org.apache.http.client.methods.HttpPost;
import org.apache.http.entity.StringEntity;
import org.apache.http.impl.client.CloseableHttpClient;
import org.apache.http.impl.client.HttpClients;
import org.apache.http.util.EntityUtils;
import org.apache.commons.io.FileUtils;
import java.io.File;
import java.io.IOException;
import java.util.HashMap;
import java.util.Map;
import java.util.Base64;

/**
 * Demo client: posts one file to the document-extraction endpoint using
 * AppCode authentication and prints the JSON reply.
 */
public class Main {
    /**
     * Reads a file and returns its contents base64-encoded.
     *
     * @param path path of the image/PDF file
     * @return base64 text, or an empty string if the file cannot be read
     *         (the stack trace is printed)
     */
    public static String get_base64(String path) {
        String b64 = "";
        try {
            byte[] content = FileUtils.readFileToByteArray(new File(path));
            b64 = Base64.getEncoder().encodeToString(content);
        } catch (IOException e) {
            e.printStackTrace();
        }
        return b64;
    }

    /**
     * Builds the request, sends it, and prints the reply.
     * A non-200 HTTP status is reported and the body is not parsed.
     */
    public static void main(String[] args) {
        String url = "https://ocr-api.shiliuai.com/api/doc_extract/v1";// API endpoint
        String appcode = "你的APPCODE";
        String file_path = "本地文件路径";

        // Typed map: with a raw Map the entries are Objects and
        // addHeader(String, String) below does not compile.
        Map<String, String> headers = new HashMap<>();
        headers.put("Authorization", "APPCODE " + appcode);
        headers.put("Content-Type", "application/json");

        // An empty prompt leaves the extraction prompt unset.
        JSONObject requestObj = new JSONObject();
        requestObj.put("file_base64", get_base64(file_path));
        requestObj.put("prompt", "");
        String bodys = requestObj.toString();

        try (CloseableHttpClient httpClient = HttpClients.createDefault()) {
            HttpPost httpPost = new HttpPost(url);
            for (Map.Entry<String, String> entry : headers.entrySet()) {
                httpPost.addHeader(entry.getKey(), entry.getValue());
            }
            StringEntity entity = new StringEntity(bodys, "UTF-8");
            httpPost.setEntity(entity);
            HttpResponse response = httpClient.execute(httpPost);
            int stat = response.getStatusLine().getStatusCode();
            if (stat != 200) {
                System.out.println("Http code: " + stat);
                return;
            }
            // Default to UTF-8 when the reply declares no charset, so the
            // Chinese msg_cn text is not decoded as ISO-8859-1.
            String res = EntityUtils.toString(response.getEntity(), "UTF-8");
            JSONObject res_obj = JSON.parseObject(res);
            System.out.println(res_obj.toJSONString());
        } catch (Exception e) {
            e.printStackTrace();
        }
    }
}

import com.alibaba.fastjson2.JSON;
import com.alibaba.fastjson2.JSONObject;
import org.apache.commons.io.FileUtils;
import org.apache.http.HttpResponse;
import org.apache.http.client.methods.HttpPost;
import org.apache.http.entity.StringEntity;
import org.apache.http.impl.client.CloseableHttpClient;
import org.apache.http.impl.client.HttpClients;
import org.apache.http.util.EntityUtils;
import java.io.File;
import java.io.IOException;
import java.util.HashMap;
import java.util.Map;
import java.util.Base64;
import java.security.MessageDigest;
import java.security.NoSuchAlgorithmException;

/**
 * Demo client: posts one file to the document-extraction endpoint using
 * signature authentication (x-ca-key / x-ca-timestamp / x-ca-signature)
 * and prints the JSON reply.
 */
public class Demo {
    /**
     * Reads a file and returns its contents base64-encoded.
     *
     * @param path path of the image/PDF file
     * @return base64 text, or an empty string if the file is missing or
     *         cannot be read (a message is written to stderr)
     */
    public static String get_base64(String path) {
        String b64 = "";
        try {
            File file = new File(path);
            if (!file.exists()) {
                System.err.println("文件不存在: " + path);
                return b64;
            }
            byte[] content = FileUtils.readFileToByteArray(file);
            b64 = Base64.getEncoder().encodeToString(content);
        } catch (IOException e) {
            System.err.println("读取文件失败: " + e.getMessage());
            e.printStackTrace();
        }
        return b64;
    }

    /**
     * Returns the lowercase hexadecimal MD5 digest of {@code input}.
     *
     * @param input text to hash; encoded as UTF-8 so the digest does not
     *              depend on the platform default charset
     * @return 32-character hex digest, or {@code null} if MD5 is unavailable
     */
    public static String MD5(String input) {
        try {
            MessageDigest md = MessageDigest.getInstance("MD5");
            byte[] messageDigest = md.digest(input.getBytes(java.nio.charset.StandardCharsets.UTF_8));
            StringBuilder hexString = new StringBuilder();
            for (byte b : messageDigest) {
                // Mask to an unsigned value and left-pad to two hex digits.
                String hex = Integer.toHexString(0xff & b);
                if (hex.length() == 1) hexString.append('0');
                hexString.append(hex);
            }
            return hexString.toString();
        } catch (NoSuchAlgorithmException e) {
            e.printStackTrace();
        }
        return null;
    }

    /**
     * Signs the request, sends it, and prints the reply.
     * On a non-200 HTTP status both the status and the body are printed.
     */
    public static void main(String[] args) {
        String url = "https://ocr-api.shiliuai.com/api/doc_extract/v1";// API endpoint
        String file_path = "本地文件路径";
        String app_key = "你的APPKEY";
        String app_secret = "你的APPSECRET";
        // Millisecond timestamp; the same value is signed and sent as a header.
        String timestamp = System.currentTimeMillis() + "";
        String sign = MD5(app_key + "&" + timestamp + "&" + app_secret);

        // Typed map: with a raw Map the entries are Objects and
        // addHeader(String, String) below does not compile.
        Map<String, String> headers = new HashMap<>();
        headers.put("Content-Type", "application/json");
        headers.put("x-ca-key", app_key);
        headers.put("x-ca-timestamp", timestamp);
        headers.put("x-ca-signature", sign);

        // An empty prompt leaves the extraction prompt unset.
        JSONObject requestObj = new JSONObject();
        requestObj.put("file_base64", get_base64(file_path));
        requestObj.put("prompt", "");
        String bodys = requestObj.toString();

        try (CloseableHttpClient httpClient = HttpClients.createDefault()) {
            HttpPost httpPost = new HttpPost(url);
            for (Map.Entry<String, String> entry : headers.entrySet()) {
                httpPost.addHeader(entry.getKey(), entry.getValue());
            }
            StringEntity entity = new StringEntity(bodys, "UTF-8");
            httpPost.setEntity(entity);
            HttpResponse response = httpClient.execute(httpPost);
            int stat = response.getStatusLine().getStatusCode();
            if (stat != 200) {
                System.out.println("Http code: " + stat);
                System.out.println("Http  " + EntityUtils.toString(response.getEntity(), "UTF-8"));
                return;
            }
            // Default to UTF-8 when the reply declares no charset, so the
            // Chinese msg_cn text is not decoded as ISO-8859-1.
            String res = EntityUtils.toString(response.getEntity(), "UTF-8");
            JSONObject res_obj = JSON.parseObject(res);
            System.out.println(res_obj.toJSONString());
        } catch (Exception e) {
            e.printStackTrace();
        }
    }
}

4.4 JavaScript

// Requires Node.js 18+ (built-in fetch).
const fs = require('fs');

const apiUrl = 'https://ocr-api.shiliuai.com/api/doc_extract/v1';
const appcode = '你的APPCODE';
const filePath = '本地文件路径';

/**
 * Upload the file at `filePath` with AppCode authentication and print the
 * reply: pretty-printed JSON on success, status plus raw body otherwise.
 */
async function main() {
  const payload = {
    file_base64: fs.readFileSync(filePath).toString('base64'),
    prompt: ''
  };
  const requestInit = {
    method: 'POST',
    headers: {
      Authorization: `APPCODE ${appcode}`,
      'Content-Type': 'application/json'
    },
    body: JSON.stringify(payload)
  };

  const res = await fetch(apiUrl, requestInit);
  const text = await res.text();
  if (res.ok) {
    console.log(JSON.stringify(JSON.parse(text), null, 2));
    return;
  }
  console.error('Http code:', res.status, text);
}

main().catch(console.error);

// Requires Node.js 18+ (built-in fetch).
const fs = require('fs');
const crypto = require('crypto');

const apiUrl = 'https://ocr-api.shiliuai.com/api/doc_extract/v1';
const filePath = '本地文件路径';
const appKey = '你的APPKEY';
const appSecret = '你的APPSECRET';
// Millisecond timestamp; the same value is signed and sent as a header.
const timestamp = Date.now().toString();
// Signature: hex MD5 of "<appKey>&<timestamp>&<appSecret>".
const signHex = crypto
  .createHash('md5')
  .update([appKey, timestamp, appSecret].join('&'))
  .digest('hex');

/**
 * Upload the file at `filePath` with signature authentication and print the
 * reply: pretty-printed JSON on success, status plus raw body otherwise.
 */
async function main() {
  const payload = {
    file_base64: fs.readFileSync(filePath).toString('base64'),
    prompt: ''
  };
  const requestInit = {
    method: 'POST',
    headers: {
      'Content-Type': 'application/json',
      'x-ca-key': appKey,
      'x-ca-timestamp': timestamp,
      'x-ca-signature': signHex
    },
    body: JSON.stringify(payload)
  };

  const res = await fetch(apiUrl, requestInit);
  const text = await res.text();
  if (res.ok) {
    console.log(JSON.stringify(JSON.parse(text), null, 2));
    return;
  }
  console.error('Http code:', res.status, text);
}

main().catch(console.error);

4.5 NodeJs

const request = require("request");
const fs = require("fs");

const apiUrl = 'https://ocr-api.shiliuai.com/api/doc_extract/v1';
const appcode = '你的APPCODE';
const filePath = '本地文件路径';

/**
 * Upload the file at `filePath` with AppCode authentication via the
 * `request` package and print the reply.
 */
function main() {
  const payload = {
    file_base64: fs.readFileSync(filePath).toString('base64'),
    prompt: '',
  };
  const options = {
    method: "POST",
    url: apiUrl,
    headers: {
      Authorization: `APPCODE ${appcode}`,
      "Content-Type": "application/json",
    },
    body: JSON.stringify(payload),
  };

  request(options, (error, response, body) => {
    if (error) {
      console.error(error);
      return;
    }
    if (response.statusCode !== 200) {
      console.error('Http code:', response.statusCode, body);
      return;
    }
    let data = body;
    if (typeof body === 'string') {
      try {
        data = JSON.parse(body);
      } catch (e) {
        // Not JSON: fall through and print the raw body.
      }
    }
    console.log(JSON.stringify(data, null, 2));
  });
}

main();

const request = require("request");
const fs = require("fs");
const crypto = require("crypto");

const apiUrl = 'https://ocr-api.shiliuai.com/api/doc_extract/v1';
const appKey = '你的APPKEY';
const appSecret = '你的APPSECRET';
const filePath = '本地文件路径';

/**
 * Upload the file at `filePath` with signature authentication via the
 * `request` package and print the reply.
 */
function main() {
  const payload = {
    file_base64: fs.readFileSync(filePath).toString('base64'),
    prompt: '',
  };
  // Millisecond timestamp; the same value is signed and sent as a header.
  const timestamp = Date.now().toString();
  // Signature: hex MD5 of "<appKey>&<timestamp>&<appSecret>".
  const signHex = crypto
    .createHash('md5')
    .update([appKey, timestamp, appSecret].join('&'))
    .digest('hex');
  const options = {
    method: "POST",
    url: apiUrl,
    headers: {
      "Content-Type": "application/json",
      "x-ca-key": appKey,
      "x-ca-timestamp": timestamp,
      "x-ca-signature": signHex,
    },
    body: JSON.stringify(payload),
  };

  request(options, (error, response, body) => {
    if (error) {
      console.error(error);
      return;
    }
    if (response.statusCode !== 200) {
      console.error('Http code:', response.statusCode, body);
      return;
    }
    let data = body;
    if (typeof body === 'string') {
      try {
        data = JSON.parse(body);
      } catch (e) {
        // Not JSON: fall through and print the raw body.
      }
    }
    console.log(JSON.stringify(data, null, 2));
  });
}

main();

4.6 cURL

# Base64-encode the image/PDF first and paste the single-line result into the
# request body, for example:
#   Linux (GNU coreutils): base64 -w 0 /path/to/file.pdf
#   macOS:                 base64 -i /path/to/file.pdf
# TLS certificate verification stays enabled (no -k): the request carries the
# AppCode and the document.

curl 'https://ocr-api.shiliuai.com/api/doc_extract/v1' \
  -H 'Authorization: APPCODE 你的APPCODE' \
  -H 'Content-Type: application/json' \
  -d '{"file_base64":"文件base64编码"}'

# Signature rule (see section 2.3, request headers):
#   sign = md5(appKey + '&' + timestamp + '&' + appSecret)
# The timestamp is in milliseconds and must be the same value that is sent in
# x-ca-timestamp. TLS certificate verification stays enabled (no -k).

curl 'https://ocr-api.shiliuai.com/api/doc_extract/v1' \
  -H 'Content-Type: application/json' \
  -H 'x-ca-key: 你的APPKEY' \
  -H 'x-ca-timestamp: 时间戳毫秒' \
  -H 'x-ca-signature: 签名值' \
  -d '{"file_base64":"文件base64编码"}'

4.7 C#

using System;
using System.Collections.Generic;
using System.IO;
using System.Net.Http;
using System.Text;
using System.Threading.Tasks;
using Newtonsoft.Json;
using Newtonsoft.Json.Linq;

namespace MyCSharpApp
{
    /// <summary>
    /// Demo client: posts one file to the document-extraction endpoint using
    /// AppCode authentication and prints the JSON reply.
    /// </summary>
    public class Program
    {
        /// <summary>Reads a file and returns its contents base64-encoded.</summary>
        /// <param name="path">Path of the image/PDF file.</param>
        /// <returns>Base64 text, or an empty string if reading fails (the message is printed).</returns>
        public static string GetBase64(string path)
        {
            string b64 = "";
            try
            {
                byte[] content = File.ReadAllBytes(path);
                b64 = Convert.ToBase64String(content);
            }
            catch (Exception e)
            {
                Console.WriteLine(e.Message);
            }
            return b64;
        }

        /// <summary>
        /// Builds the request, sends it, and prints the reply. A non-success
        /// HTTP status is reported and the body is not parsed.
        /// </summary>
        public static async Task Main(string[] args)
        {
            string url = "https://ocr-api.shiliuai.com/api/doc_extract/v1";// API endpoint
            string appcode = "你的APPCODE";
            string file_path = "本地文件路径";

            // Generic arguments are required: a bare "Dictionary" does not
            // compile and header.Key/header.Value below must be strings.
            Dictionary<string, string> headers = new Dictionary<string, string>
            {
                { "Authorization", "APPCODE " + appcode }
            };

            // An empty prompt leaves the extraction prompt unset.
            JObject requestObj = new JObject();
            requestObj["file_base64"] = GetBase64(file_path);
            requestObj["prompt"] = "";
            string body = requestObj.ToString();

            try
            {
                using (HttpClient client = new HttpClient())
                {
                    foreach (var header in headers)
                    {
                        client.DefaultRequestHeaders.Add(header.Key, header.Value);
                    }
                    // Content-Type is set on the content object.
                    StringContent content = new StringContent(body, Encoding.UTF8, "application/json");
                    HttpResponseMessage response = await client.PostAsync(url, content);
                    if (!response.IsSuccessStatusCode)
                    {
                        Console.WriteLine($"Http code: {(int)response.StatusCode}");
                        return;
                    }
                    string responseContent = await response.Content.ReadAsStringAsync();
                    JObject resObj = JObject.Parse(responseContent);
                    Console.WriteLine(resObj.ToString(Formatting.Indented));
                }
            }
            catch (Exception e)
            {
                Console.WriteLine(e.Message);
            }
        }
    }
}

using System;
using System.Collections.Generic;
using System.IO;
using System.Net.Http;
using System.Security.Cryptography;
using System.Text;
using System.Threading.Tasks;
using Newtonsoft.Json;
using Newtonsoft.Json.Linq;

namespace MyCSharpApp
{
    /// <summary>
    /// Demo client: posts one file to the document-extraction endpoint using
    /// signature authentication (x-ca-key / x-ca-timestamp / x-ca-signature)
    /// and prints the JSON reply.
    /// </summary>
    public class Program
    {
        /// <summary>Reads a file and returns its contents base64-encoded.</summary>
        /// <param name="path">Path of the image/PDF file.</param>
        /// <returns>Base64 text, or an empty string if reading fails (the message goes to stderr).</returns>
        public static string GetBase64(string path)
        {
            string b64 = "";
            try
            {
                byte[] content = File.ReadAllBytes(path);
                b64 = Convert.ToBase64String(content);
            }
            catch (Exception e)
            {
                Console.Error.WriteLine("读取文件失败: " + e.Message);
            }
            return b64;
        }

        /// <summary>Returns the lowercase hexadecimal MD5 digest of the UTF-8 bytes of <paramref name="input"/>.</summary>
        /// <param name="input">Text to hash.</param>
        /// <returns>32-character hex digest, or an empty string if hashing throws (the message is printed).</returns>
        public static string CalculateMD5(string input)
        {
            try
            {
                using (MD5 md5 = MD5.Create())
                {
                    byte[] inputBytes = Encoding.UTF8.GetBytes(input);
                    byte[] hashBytes = md5.ComputeHash(inputBytes);
                    StringBuilder sb = new StringBuilder();
                    for (int i = 0; i < hashBytes.Length; i++)
                    {
                        sb.Append(hashBytes[i].ToString("x2"));
                    }
                    return sb.ToString();
                }
            }
            catch (Exception e)
            {
                Console.WriteLine(e.Message);
                return string.Empty;
            }
        }

        /// <summary>
        /// Signs the request, sends it, and prints the reply. On a non-success
        /// HTTP status both the status and the body are printed.
        /// </summary>
        public static async Task Main(string[] args)
        {
            string url = "https://ocr-api.shiliuai.com/api/doc_extract/v1";// API endpoint
            string file_path = "本地文件路径";
            string app_key = "你的APPKEY";
            string app_secret = "你的APPSECRET";
            // Millisecond timestamp; the same value is signed and sent as a header.
            string timestamp = DateTimeOffset.Now.ToUnixTimeMilliseconds().ToString();
            string sign = CalculateMD5(app_key + "&" + timestamp + "&" + app_secret);

            // Generic arguments are required: a bare "Dictionary" does not
            // compile and header.Key/header.Value below must be strings.
            Dictionary<string, string> headers = new Dictionary<string, string>
            {
                { "x-ca-key", app_key },
                { "x-ca-timestamp", timestamp },
                { "x-ca-signature", sign }
            };

            // An empty prompt leaves the extraction prompt unset.
            JObject requestObj = new JObject();
            requestObj["file_base64"] = GetBase64(file_path);
            requestObj["prompt"] = "";
            string body = requestObj.ToString();

            try
            {
                using (HttpClient client = new HttpClient())
                {
                    foreach (var header in headers)
                    {
                        client.DefaultRequestHeaders.Add(header.Key, header.Value);
                    }
                    // Content-Type is set on the content object.
                    StringContent content = new StringContent(body, Encoding.UTF8, "application/json");
                    HttpResponseMessage response = await client.PostAsync(url, content);
                    if (!response.IsSuccessStatusCode)
                    {
                        Console.WriteLine($"Http code: {(int)response.StatusCode}");
                        Console.WriteLine($"Http {await response.Content.ReadAsStringAsync()}");
                        return;
                    }
                    string responseContent = await response.Content.ReadAsStringAsync();
                    JObject resObj = JObject.Parse(responseContent);
                    Console.WriteLine(resObj.ToString(Formatting.Indented));
                }
            }
            catch (Exception e)
            {
                Console.WriteLine(e.Message);
            }
        }
    }
}

4.8 Go

package main

import (
	"bytes"
	"encoding/base64"
	"encoding/json"
	"fmt"
	"io"
	"net/http"
	"os"
)

// URL is the document-extraction API endpoint.
const URL = "https://ocr-api.shiliuai.com/api/doc_extract/v1"

// RequestBody is the JSON request payload: the base64-encoded file and the
// extraction prompt.
type RequestBody struct {
	FileBase64 string `json:"file_base64"`
	Prompt     string `json:"prompt"`
}

// 图片转base64
func getBase64(filePath string) (string, error) {
	data, err := os.ReadFile(filePath)
	if err != nil {
		return "", fmt.Errorf("读取文件失败: %w", err)
	}
	b64 := base64.StdEncoding.EncodeToString(data)
	return b64, nil
}

// demo uploads the file at filePath with AppCode authentication and prints
// the decoded JSON reply. Every failing step is returned as a wrapped error.
func demo(appcode, filePath string) error {
	encoded, err := getBase64(filePath)
	if err != nil {
		return fmt.Errorf("获取base64编码失败: %w", err)
	}

	// An empty prompt leaves the extraction prompt unset.
	payload, err := json.Marshal(RequestBody{FileBase64: encoded, Prompt: ""})
	if err != nil {
		return fmt.Errorf("序列化请求体失败: %w", err)
	}

	req, err := http.NewRequest("POST", URL, bytes.NewBuffer(payload))
	if err != nil {
		return fmt.Errorf("创建请求失败: %w", err)
	}
	req.Header.Set("Authorization", "APPCODE "+appcode)
	req.Header.Set("Content-Type", "application/json")

	resp, err := (&http.Client{}).Do(req)
	if err != nil {
		return fmt.Errorf("发送请求失败: %w", err)
	}
	defer resp.Body.Close()

	raw, err := io.ReadAll(resp.Body)
	if err != nil {
		return fmt.Errorf("读取响应失败: %w", err)
	}

	// Decode into a generic value; the reply is only printed.
	var decoded interface{}
	if err = json.Unmarshal(raw, &decoded); err != nil {
		return fmt.Errorf("解析响应JSON失败: %w", err)
	}

	fmt.Printf("%+v\n", decoded)
	return nil
}

// main runs the AppCode demo with placeholder credentials; on failure it
// prints the error to stderr and exits with status 1.
func main() {
	const (
		appcode  = "你的APPCODE"
		filePath = "本地文件路径"
	)

	err := demo(appcode, filePath)
	if err == nil {
		return
	}
	fmt.Fprintf(os.Stderr, "错误: %v\n", err)
	os.Exit(1)
}

package main

import (
	"bytes"
	"crypto/md5"
	"encoding/base64"
	"encoding/hex"
	"encoding/json"
	"fmt"
	"io"
	"net/http"
	"os"
	"strconv"
	"time"
)

// URL is the document-extraction API endpoint.
const URL = "https://ocr-api.shiliuai.com/api/doc_extract/v1"

// RequestBody is the JSON request payload: the base64-encoded file and the
// extraction prompt.
type RequestBody struct {
	FileBase64 string `json:"file_base64"`
	Prompt     string `json:"prompt"`
}

// 图片转base64
func getBase64(filePath string) (string, error) {
	data, err := os.ReadFile(filePath)
	if err != nil {
		return "", fmt.Errorf("读取文件失败: %w", err)
	}
	b64 := base64.StdEncoding.EncodeToString(data)
	return b64, nil
}

// md5Hex returns the lowercase hexadecimal MD5 digest of s.
func md5Hex(s string) string {
	digest := md5.Sum([]byte(s))
	encoded := hex.EncodeToString(digest[:])
	return encoded
}

// demo uploads the file at filePath with signature authentication and prints
// the decoded JSON reply. The signature is the hex MD5 of
// "<appKey>&<timestamp-ms>&<appSecret>". Every failing step is returned as a
// wrapped error.
func demo(appKey, appSecret, filePath string) error {
	encoded, err := getBase64(filePath)
	if err != nil {
		return fmt.Errorf("获取base64编码失败: %w", err)
	}

	// An empty prompt leaves the extraction prompt unset.
	payload, err := json.Marshal(RequestBody{FileBase64: encoded, Prompt: ""})
	if err != nil {
		return fmt.Errorf("序列化请求体失败: %w", err)
	}

	// Millisecond timestamp; the same value is signed and sent as a header.
	timestamp := strconv.FormatInt(time.Now().UnixMilli(), 10)
	signature := md5Hex(appKey + "&" + timestamp + "&" + appSecret)

	req, err := http.NewRequest("POST", URL, bytes.NewBuffer(payload))
	if err != nil {
		return fmt.Errorf("创建请求失败: %w", err)
	}
	for name, value := range map[string]string{
		"x-ca-key":       appKey,
		"x-ca-timestamp": timestamp,
		"x-ca-signature": signature,
		"Content-Type":   "application/json",
	} {
		req.Header.Set(name, value)
	}

	resp, err := (&http.Client{}).Do(req)
	if err != nil {
		return fmt.Errorf("发送请求失败: %w", err)
	}
	defer resp.Body.Close()

	raw, err := io.ReadAll(resp.Body)
	if err != nil {
		return fmt.Errorf("读取响应失败: %w", err)
	}

	// Decode into a generic value; the reply is only printed.
	var decoded interface{}
	if err = json.Unmarshal(raw, &decoded); err != nil {
		return fmt.Errorf("解析响应JSON失败: %w", err)
	}

	fmt.Printf("%+v\n", decoded)
	return nil
}

// main runs the signature demo with placeholder credentials; on failure it
// prints the error to stderr and exits with status 1.
func main() {
	const (
		appKey    = "你的APP_KEY"
		appSecret = "你的APP_SECRET"
		filePath  = "本地文件路径"
	)

	err := demo(appKey, appSecret, filePath)
	if err == nil {
		return
	}
	fmt.Fprintf(os.Stderr, "错误: %v\n", err)
	os.Exit(1)
}

4.9 易语言

版本 2
.支持库 spec
.支持库 dp1

.子程序 OCR_简单认证
.局部变量 局_网址, 文本型
.局部变量 局_提交数据, 文本型
.局部变量 局_提交协议头, 文本型
.局部变量 局_结果, 字节集
.局部变量 局_返回, 文本型
.局部变量 图片数据, 字节集
.局部变量 base64图片, 文本型

' Sends one file to the document-extraction endpoint with AppCode authentication and returns the reply text.
' NOTE(review): 编码_BASE64编码 / 网页_访问_对象 / 编码_编码转换对象 are not defined in this snippet - presumably from a third-party module; confirm it is loaded.
' NOTE(review): the subroutine returns a text value but declares no return type - confirm this compiles.
' Read the file (path is hard-coded) and base64-encode it.
图片数据 ＝ 读入文件 ("你的文件路径")
base64图片 ＝ 编码_BASE64编码 (图片数据)
' Build the JSON body by hand: {"file_base64":"<base64>"}; no prompt field is sent.
局_提交数据 ＝ "{" ＋ #引号 ＋ "file_base64" ＋ #引号 ＋ ":" ＋ #引号 ＋ base64图片 ＋ #引号 ＋ "}"
局_网址 ＝ "https://ocr-api.shiliuai.com/api/doc_extract/v1"
' Request headers, one per line.
局_提交协议头 ＝ "Authorization: APPCODE 你的AppCode" ＋ #换行符 ＋ "Content-Type: application/json"
' NOTE(review): the second argument 1 presumably selects POST - verify against the helper's documentation.
局_结果 ＝ 网页_访问_对象 (局_网址, 1, 局_提交数据, , , 局_提交协议头, , , , , , , , , , , , , )
' Convert the response bytes to text and return it.
局_返回 ＝ 到文本 (编码_编码转换对象 (局_结果, , , ))
返回 (局_返回)

版本 2
.支持库 spec
.支持库 dp1

.子程序 OCR_签名认证
.参数 app_key, 文本型
.参数 app_secret, 文本型
.参数 文件路径, 文本型
.局部变量 局_网址, 文本型
.局部变量 局_提交数据, 文本型
.局部变量 局_提交协议头, 文本型
.局部变量 局_结果, 字节集
.局部变量 局_返回, 文本型
.局部变量 文件数据, 字节集
.局部变量 base64文件, 文本型
.局部变量 时间戳, 文本型
.局部变量 签名字符串, 文本型
.局部变量 签名, 文本型

' Sends one file to the document-extraction endpoint with signature authentication and returns the reply text.
' NOTE(review): 编码_BASE64编码 / 时间_取时间戳 / 编码_MD5摘要 / 到十六进制文本 / 网页_访问_对象 / 编码_编码转换对象 are not defined in this snippet - presumably from a third-party module; confirm it is loaded.
' NOTE(review): the subroutine returns a text value but declares no return type - confirm this compiles.
' Read the file and base64-encode it.
文件数据 ＝ 读入文件 (文件路径)
base64文件 ＝ 编码_BASE64编码 (文件数据)
' NOTE(review): assumes 时间_取时间戳 returns seconds, so * 1000 yields milliseconds - confirm.
时间戳 ＝ 到文本 (时间_取时间戳 () * 1000)
' String to sign: app_key & timestamp & app_secret.
签名字符串 ＝ app_key ＋ "&" ＋ 时间戳 ＋ "&" ＋ app_secret
' NOTE(review): the other samples send a lowercase hex MD5 - verify the letter case produced here.
签名 ＝ 到十六进制文本 (编码_MD5摘要 (到字节集 (签名字符串)))

' Build the JSON body by hand: {"file_base64":"<base64>"}; no prompt field is sent.
局_提交数据 ＝ "{" ＋ #引号 ＋ "file_base64" ＋ #引号 ＋ ":" ＋ #引号 ＋ base64文件 ＋ #引号 ＋ "}"
局_网址 ＝ "https://ocr-api.shiliuai.com/api/doc_extract/v1"
' Request headers, one per line.
局_提交协议头 ＝ "x-ca-key: " ＋ app_key ＋ #换行符 ＋ "x-ca-timestamp: " ＋ 时间戳 ＋ #换行符 ＋ "x-ca-signature: " ＋ 签名 ＋ #换行符 ＋ "Content-Type: application/json"
' NOTE(review): the second argument 1 presumably selects POST - verify against the helper's documentation.
局_结果 ＝ 网页_访问_对象 (局_网址, 1, 局_提交数据, , , 局_提交协议头, , , , , , , , , , , , , )
' Convert the response bytes to text and return it.
局_返回 ＝ 到文本 (编码_编码转换对象 (局_结果, , , ))
返回 (局_返回)

4.10 天诺

/// <summary>
/// Posts <paramref name="image"/> to the document-extraction endpoint using
/// AppCode authentication and returns whatever CustomHelp.HttpPost returns.
/// </summary>
/// <param name="image">Image to upload; encoded by CustomHelp.ImageTobase64.</param>
/// <param name="appcode">AppCode credential.</param>
public static string OCR_Easy(Image image, string appcode)
{
    const string endpoint = "https://ocr-api.shiliuai.com/api/doc_extract/v1";

    var requestHeaders = new Dictionary<string, string>();
    requestHeaders.Add("Authorization", "APPCODE " + appcode);
    requestHeaders.Add("Content-Type", "application/json");

    // Hand-built JSON body: {"file_base64":"<base64>"}
    string encodedImage = CustomHelp.ImageTobase64(image);
    string payload = string.Format("{{\"file_base64\":\"{0}\"}}", encodedImage);
    return CustomHelp.HttpPost(endpoint, payload, requestHeaders);
}

// Credentials for signature authentication; replace the placeholders.
// app_key is sent in the x-ca-key header, app_secret is only used to compute the signature.
public static string app_key = "你的APPKEY";
public static string app_secret = "你的APPSECRET";

/// <summary>Returns the current Unix time in milliseconds as a decimal string.</summary>
public static string GetTimestampMs()
{
    long unixMilliseconds = DateTimeOffset.Now.ToUnixTimeMilliseconds();
    return unixMilliseconds.ToString();
}

/// <summary>Returns the lowercase hexadecimal MD5 digest of the UTF-8 bytes of <paramref name="input"/>.</summary>
public static string MD5(string input)
{
    using (var hasher = System.Security.Cryptography.MD5.Create())
    {
        byte[] digest = hasher.ComputeHash(System.Text.Encoding.UTF8.GetBytes(input));
        var hex = new System.Text.StringBuilder();
        for (int i = 0; i < digest.Length; i++)
        {
            hex.Append(digest[i].ToString("x2"));
        }
        return hex.ToString();
    }
}

/// <summary>
/// Posts <paramref name="image"/> to the document-extraction endpoint using
/// signature authentication and returns whatever CustomHelp.HttpPost returns.
/// The signature is MD5("app_key&amp;timestamp&amp;app_secret").
/// </summary>
/// <param name="image">Image to upload; encoded by CustomHelp.ImageTobase64.</param>
public static string OCR_Sign(Image image)
{
    const string endpoint = "https://ocr-api.shiliuai.com/api/doc_extract/v1";

    // The same timestamp value is signed and sent as a header.
    string timestamp = GetTimestampMs();
    string signature = MD5(string.Join("&", app_key, timestamp, app_secret));

    var requestHeaders = new Dictionary<string, string>();
    requestHeaders.Add("x-ca-key", app_key);
    requestHeaders.Add("x-ca-timestamp", timestamp);
    requestHeaders.Add("x-ca-signature", signature);
    requestHeaders.Add("Content-Type", "application/json");

    // Hand-built JSON body: {"file_base64":"<base64>"}
    string encodedImage = CustomHelp.ImageTobase64(image);
    string payload = string.Format("{{\"file_base64\":\"{0}\"}}", encodedImage);
    return CustomHelp.HttpPost(endpoint, payload, requestHeaders);
}

4.11 按键精灵-电脑版

Import "Encrypt.dll"
VBSBegin
' Returns the contents of filePath as a single-line base64 string.
' The file is read as binary through ADODB.Stream and encoded by an MSXML
' element typed "bin.base64". MSXML breaks the encoded text into lines, and a
' raw line break inside a JSON string value is invalid, so CR/LF are removed.
Function Base64Encode(filePath)
    Set inStream = CreateObject("ADODB.Stream")
    inStream.Type = 1 ' binary
    inStream.Open
    inStream.LoadFromFile filePath
    inStream.Position = 0
    Set dom = CreateObject("MSXML2.DOMDocument")
    Set elem = dom.createElement("tmp")
    elem.dataType = "bin.base64"
    elem.nodeTypedValue = inStream.Read
    inStream.Close
    Base64Encode = Replace(Replace(elem.Text, vbCr, ""), vbLf, "")
End Function

' Posts the file at imgPath to the document-extraction endpoint using AppCode
' authentication and returns the raw response text.
'   appcode - AppCode credential
'   imgPath - path of the local image/PDF
Function ocr_easy(appcode, imgPath)
    url = "https://ocr-api.shiliuai.com/api/doc_extract/v1"
    ' VBScript has no backslash escapes: a double quote inside a string
    ' literal is written as "". Result: {"file_base64":"<base64>"}
    jsonBody = "{""file_base64"":""" & Base64Encode(imgPath) & """}"
    Set http = CreateObject("MSXML2.XMLHTTP")
    http.Open "POST", url, False ' synchronous request
    http.setRequestHeader "Authorization", "APPCODE " & appcode
    http.setRequestHeader "Content-Type", "application/json"
    http.send jsonBody
    ocr_easy = http.responseText
End Function
VBSEnd

' Example call: replace the placeholders, then print the raw response text.
appcode = "你的APPCODE"
res = ocr_easy(appcode, "你的文件路径")
TracePrint res

Import "Encrypt.dll"
VBSBegin
' Returns the MD5 of str in lowercase, as produced by the Encrypt plugin.
' NOTE(review): assumes Encrypt.Md5String returns a hex string and is callable inside a VBSBegin/VBSEnd block - confirm.
Function MD5(str)
    MD5 = LCase(Encrypt.Md5String(str))
End Function

' Returns the contents of filePath as a single-line base64 string.
' The file is read as binary through ADODB.Stream and encoded by an MSXML
' element typed "bin.base64". MSXML breaks the encoded text into lines, and a
' raw line break inside a JSON string value is invalid, so CR/LF are removed.
Function Base64Encode(filePath)
    Set inStream = CreateObject("ADODB.Stream")
    inStream.Type = 1 ' binary
    inStream.Open
    inStream.LoadFromFile filePath
    inStream.Position = 0
    Set dom = CreateObject("MSXML2.DOMDocument")
    Set elem = dom.createElement("tmp")
    elem.dataType = "bin.base64"
    elem.nodeTypedValue = inStream.Read
    inStream.Close
    Base64Encode = Replace(Replace(elem.Text, vbCr, ""), vbLf, "")
End Function

' Posts the file at imgPath to the document-extraction endpoint using
' signature authentication and returns the raw response text.
'   appKey    - AppKey credential (x-ca-key)
'   appSecret - AppSecret, used only to compute the signature
'   imgPath   - path of the local image/PDF
Function ocr_sign(appKey, appSecret, imgPath)
    url = "https://ocr-api.shiliuai.com/api/doc_extract/v1"
    ' Now() is local time, which would shift the epoch timestamp by the
    ' machine's UTC offset. Convert to UTC first so the value matches the
    ' epoch milliseconds used by the other samples.
    Set utcConv = CreateObject("WbemScripting.SWbemDateTime")
    utcConv.SetVarDate Now()
    utcNow = utcConv.GetVarDate(False)
    timestamp = CStr(DateDiff("s", "01/01/1970 00:00:00", utcNow) * 1000)
    signature = MD5(appKey & "&" & timestamp & "&" & appSecret)
    ' VBScript has no backslash escapes: a double quote inside a string
    ' literal is written as "". Result: {"file_base64":"<base64>"}
    jsonBody = "{""file_base64"":""" & Base64Encode(imgPath) & """}"
    Set http = CreateObject("MSXML2.XMLHTTP")
    http.Open "POST", url, False ' synchronous request
    http.setRequestHeader "x-ca-key", appKey
    http.setRequestHeader "x-ca-timestamp", timestamp
    http.setRequestHeader "x-ca-signature", signature
    http.setRequestHeader "Content-Type", "application/json"
    http.send jsonBody
    ocr_sign = http.responseText
End Function
VBSEnd

' Example call: replace the placeholders, then print the raw response text.
appKey = "你的APPKEY"
appSecret = "你的APPSECRET"
res = ocr_sign(appKey, appSecret, "你的文件路径")
TracePrint res

4.12 按键精灵-手机版

Import "yd.luae"
Import "zm.luae"

' Take a screenshot and save it to imagePath; this file is what gets uploaded.
Dim imagePath = "/sdcard/Pictures/test.png"
SnapShotEx imagePath

' Posts the file at imagePath with AppCode authentication and returns the decoded reply.
' NOTE(review): yd.Base64EncodeFile / yd.HttpPost / yd.JsonDecode come from the imported plugin - confirm their signatures.
Function ocr_easy(appcode, imagePath)
    Dim url = "https://ocr-api.shiliuai.com/api/doc_extract/v1"
    ' Hand-built JSON body: {"file_base64":"<base64>"}; no prompt field is sent.
    Dim body = "{\"file_base64\":\"" & yd.Base64EncodeFile(imagePath) & "\"}"
    Dim headers = {null}
    headers["Authorization"] = "APPCODE " & appcode
    headers["Content-Type"] = "application/json"
    Dim res = yd.HttpPost(url, body, headers)
    ocr_easy = yd.JsonDecode(res)
End Function

' Example call; t1/t2 bracket the request with tick counts but are not printed.
Dim appcode = "你的 APPCODE"
Dim t1 = TickCount()
Dim res = ocr_easy(appcode, imagePath)
Dim t2 = TickCount()
' Print the "code" field of the decoded reply (200 means success).
TracePrint res["code"]

Import "yd.luae"
Import "zm.luae"

' Take a screenshot and save it to imagePath; this file is what gets uploaded.
Dim imagePath = "/sdcard/Pictures/test.png"
SnapShotEx imagePath

' Credentials for signature authentication; replace the placeholders.
Dim appKey = "你的 APPKEY"
Dim appSecret = "你的 APPSECRET"

' Posts the file at imagePath with signature authentication and returns the decoded reply.
' NOTE(review): yd.* and Encode.Md5 come from imported plugins/libraries - confirm their signatures and that the MD5 is lowercase hex.
Function ocr_sign(appKey, appSecret, imagePath)
    Dim url = "https://ocr-api.shiliuai.com/api/doc_extract/v1"
    ' Seconds since the epoch times 1000; the same value is signed and sent as a header.
    Dim timestamp = CStr(os.time()*1000)
    Dim signature = Encode.Md5(appKey & "&" & timestamp & "&" & appSecret)
    ' Hand-built JSON body: {"file_base64":"<base64>"}; no prompt field is sent.
    Dim body = "{\"file_base64\":\"" & yd.Base64EncodeFile(imagePath) & "\"}"
    Dim headers = {null}
    headers["x-ca-key"] = appKey
    headers["x-ca-timestamp"] = timestamp
    headers["x-ca-signature"] = signature
    headers["Content-Type"] = "application/json"
    Dim res = yd.HttpPost(url, body, headers)
    ocr_sign = yd.JsonDecode(res)
End Function

' Example call; t1/t2 bracket the request with tick counts but are not printed.
Dim t1 = TickCount()
Dim res = ocr_sign(appKey, appSecret, imagePath)
Dim t2 = TickCount()
' Print the "code" field of the decoded reply (200 means success).
TracePrint res["code"]

4.13 触动精灵

require("tsnet")
require "TSLib"
local ts = require("ts")
local json = ts.json

--- Read a whole file in binary mode and return it base64-encoded.
-- @param path path of the file to read
-- @return the result of calling base64_encode on the file contents,
--         or nil when the file cannot be opened
function readFileBase64(path)
    local handle = io.open(path, "rb")
    if handle then
        local content = handle:read("*all")
        handle:close()
        -- base64_encode is a string method supplied by the runtime, not by stock Lua.
        return content:base64_encode()
    end
    return nil
end

--- Call the document-extraction API using simple (AppCode) authentication.
-- The file at imagePath is base64-encoded and posted as the "file_base64"
-- field of a JSON body.
-- @param appcode   AppCode credential; sent as "APPCODE <appcode>" in the Authorization header
-- @param imagePath path of the image/PDF file to upload
-- @return the decoded JSON response table. When the file cannot be read, no
--         request is sent and a locally built table shaped like the API's
--         error response (code = 400, success = false) is returned instead.
function ocr_easy(appcode, imagePath)
    local fileBase64 = readFileBase64(imagePath)
    if not fileBase64 then
        -- readFileBase64 yields nil for an unreadable path. A nil value drops
        -- the key from the table, so the request would go out without
        -- file_base64; fail locally with a clear message instead.
        return {
            code = 400,
            success = false,
            msg = "cannot read file: " .. tostring(imagePath),
            msg_cn = "无法读取文件: " .. tostring(imagePath),
            data = {},
        }
    end

    local url = "https://ocr-api.shiliuai.com/api/doc_extract/v1"
    local body = json.encode({ file_base64 = fileBase64 })
    local headers = {
        ["Authorization"] = "APPCODE " .. appcode,
        ["Content-Type"] = "application/json",
    }
    local resp = httpPost(url, body, { headers = headers })
    return json.decode(resp)
end

require("tsnet")
require "TSLib"
local ts = require("ts")
local json = ts.json

--- Read a whole file in binary mode and return it base64-encoded.
-- @param path path of the file to read
-- @return the result of calling base64_encode on the file contents,
--         or nil when the file cannot be opened
function readFileBase64(path)
    local handle = io.open(path, "rb")
    if handle then
        local content = handle:read("*all")
        handle:close()
        -- base64_encode is a string method supplied by the runtime, not by stock Lua.
        return content:base64_encode()
    end
    return nil
end

--- Call the document-extraction API using signature authentication.
-- The signature is the MD5 of "appKey&timestamp&appSecret", where timestamp
-- is the current time in milliseconds; it is sent with the key and timestamp
-- in the x-ca-* headers.
-- @param appKey    AppKey, sent in the x-ca-key header
-- @param appSecret AppSecret, only used to build the signature
-- @param imagePath path of the image/PDF file to upload
-- @return the decoded JSON response table. When the file cannot be read, no
--         request is sent and a locally built table shaped like the API's
--         error response (code = 400, success = false) is returned instead.
function ocr_sign(appKey, appSecret, imagePath)
    local fileBase64 = readFileBase64(imagePath)
    if not fileBase64 then
        -- readFileBase64 yields nil for an unreadable path. A nil value drops
        -- the key from the table, so the request would go out without
        -- file_base64; fail locally with a clear message instead.
        return {
            code = 400,
            success = false,
            msg = "cannot read file: " .. tostring(imagePath),
            msg_cn = "无法读取文件: " .. tostring(imagePath),
            data = {},
        }
    end

    local url = "https://ocr-api.shiliuai.com/api/doc_extract/v1"
    -- os.time() is in seconds; the API expects a millisecond timestamp.
    local timestamp = tostring(os.time() * 1000)
    -- md5 is a string method supplied by the runtime, not by stock Lua.
    local signature = (appKey .. "&" .. timestamp .. "&" .. appSecret):md5()
    local body = json.encode({ file_base64 = fileBase64 })
    local headers = {
        ["x-ca-key"] = appKey,
        ["x-ca-timestamp"] = timestamp,
        ["x-ca-signature"] = signature,
        ["Content-Type"] = "application/json",
    }
    local resp = httpPost(url, body, { headers = headers })
    return json.decode(resp)
end

4.14 懒人精灵

--- Call the document-extraction API using simple (AppCode) authentication.
-- @param appcode   AppCode credential; sent as "APPCODE <appcode>" in the Authorization header
-- @param imagePath path handed to getFileBase64; its result is posted as "file_base64"
-- @return the value jsonLib.decode produces from the response
function ocr_easy(appcode, imagePath)
    local fileBase64 = getFileBase64(imagePath)
    local payload = jsonLib.encode({ file_base64 = fileBase64 })
    local requestOptions = {
        headers = {
            ["Authorization"] = "APPCODE " .. appcode,
            ["Content-Type"] = "application/json",
        },
    }
    local reply = httpPost("https://ocr-api.shiliuai.com/api/doc_extract/v1", payload, requestOptions)
    return jsonLib.decode(reply)
end

--- Call the document-extraction API using signature authentication.
-- The signature is MD5("appKey&timestamp&appSecret") with a millisecond
-- timestamp derived from os.time().
-- @param appKey    AppKey, sent in the x-ca-key header
-- @param appSecret AppSecret, only used to build the signature
-- @param imagePath path handed to getFileBase64; its result is posted as "file_base64"
-- @return the value jsonLib.decode produces from the response
function ocr_sign(appKey, appSecret, imagePath)
    local stamp = tostring(os.time() * 1000)
    local digest = MD5(appKey .. "&" .. stamp .. "&" .. appSecret)
    local fileBase64 = getFileBase64(imagePath)
    local payload = jsonLib.encode({ file_base64 = fileBase64 })
    local requestOptions = {
        headers = {
            ["x-ca-key"] = appKey,
            ["x-ca-timestamp"] = stamp,
            ["x-ca-signature"] = digest,
            ["Content-Type"] = "application/json",
        },
    }
    local reply = httpPost("https://ocr-api.shiliuai.com/api/doc_extract/v1", payload, requestOptions)
    return jsonLib.decode(reply)
end

4.15 EasyClick

--- Sample entry point: capture the screen and send it through ocr_easy.
-- Requests screen-capture permission (retrying once), grabs a full-screen
-- image, uploads it with ocr_easy and logs the returned code. Stops early,
-- with a log line, when permission is refused twice, when no image is
-- captured, or when ocr_easy returns nothing.
function main()
    local granted = image.requestScreenCapture(10000, 0)
    if not granted then
        granted = image.requestScreenCapture(10000, 0)
    end
    if not granted then
        -- Without permission a capture cannot succeed, so stop here instead
        -- of uploading an invalid image.
        logd("申请截图权限失败")
        return
    end

    local appCode = "你的 APPCODE"
    local img = image.captureFullScreenEx()
    if not img then
        -- Guard in case the capture yields nothing; there would be no image to encode.
        logd("截图失败")
        return
    end

    local res = ocr_easy(appCode, img)
    if not res then
        logd("请求失败")
        return
    end
    logd(res.code)
end

--- Upload a captured image to the document-extraction API using simple
-- (AppCode) authentication.
-- The image is converted to a base64 JPEG (quality 100) and then recycled,
-- so the caller must not reuse img afterwards.
-- @param appCode AppCode credential; sent as "APPCODE <appCode>" in the Authorization header
-- @param img     image object as returned by the capture API
-- @return the value JSON.parse produces from the response body
function ocr_easy(appCode, img)
    local encoded = image.toBase64Format(img, "jpg", 100)
    image.recycle(img)
    local payload = JSON.stringify({ file_base64 = encoded })

    local reqHeaders = {}
    reqHeaders["Authorization"] = "APPCODE " .. appCode
    reqHeaders["Content-Type"] = "application/json"

    local reply = http.request({
        url = "https://ocr-api.shiliuai.com/api/doc_extract/v1",
        method = "POST",
        headers = reqHeaders,
        requestBody = payload,
    })
    return JSON.parse(reply.body)
end

--- Sample entry point: capture the screen and send it through ocr_sign.
-- Requests screen-capture permission (retrying once), grabs a full-screen
-- image, uploads it with ocr_sign and logs the returned code. Stops early,
-- with a log line, when permission is refused twice, when no image is
-- captured, or when ocr_sign returns nothing.
function main()
    local granted = image.requestScreenCapture(10000, 0)
    if not granted then
        granted = image.requestScreenCapture(10000, 0)
    end
    if not granted then
        -- Without permission a capture cannot succeed, so stop here instead
        -- of uploading an invalid image.
        logd("申请截图权限失败")
        return
    end

    local appKey = "你的 APPKEY"
    local appSecret = "你的 APPSECRET"
    local img = image.captureFullScreenEx()
    if not img then
        -- Guard in case the capture yields nothing; there would be no image to encode.
        logd("截图失败")
        return
    end

    local res = ocr_sign(appKey, appSecret, img)
    if not res then
        logd("请求失败")
        return
    end
    logd(res.code)
end

--- Upload a captured image to the document-extraction API using signature
-- authentication.
-- The signature is the MD5 of "appKey&timestamp&appSecret" with a millisecond
-- timestamp derived from os.time(). The image is converted to a base64 JPEG
-- (quality 100) and then recycled, so the caller must not reuse img afterwards.
-- @param appKey    AppKey, sent in the x-ca-key header
-- @param appSecret AppSecret, only used to build the signature
-- @param img       image object as returned by the capture API
-- @return the value JSON.parse produces from the response body
function ocr_sign(appKey, appSecret, img)
    local encoded = image.toBase64Format(img, "jpg", 100)
    local stamp = tostring(os.time() * 1000)
    local digest = utils.dataMd5(appKey .. "&" .. stamp .. "&" .. appSecret)
    image.recycle(img)
    local payload = JSON.stringify({ file_base64 = encoded })

    local reqHeaders = {}
    reqHeaders["x-ca-key"] = appKey
    reqHeaders["x-ca-timestamp"] = stamp
    reqHeaders["x-ca-signature"] = digest
    reqHeaders["Content-Type"] = "application/json"

    local reply = http.request({
        url = "https://ocr-api.shiliuai.com/api/doc_extract/v1",
        method = "POST",
        headers = reqHeaders,
        requestBody = payload,
    })
    return JSON.parse(reply.body)
end