PDF识别

本文介绍PDF识别常用语言和常见情况的示例代码。

说明
  • 您可以进入在线咨询获取在线人工帮助。

  • 阿里云视觉智能开放平台视觉AI能力API接入、接口使用或问题咨询等,请通过钉钉群(23109592)加入阿里云视觉智能开放平台咨询群联系我们。

能力介绍

PDF识别能力介绍及调用参数,详情请参见PDF识别

SDK包安装

常见语言的SDK依赖包信息,详情请参见SDK总览

配置环境变量

配置环境变量ALIBABA_CLOUD_ACCESS_KEY_IDALIBABA_CLOUD_ACCESS_KEY_SECRET

重要
  • 阿里云账号AccessKey拥有所有API的访问权限,建议您使用RAM用户进行API访问或日常运维,具体操作,请参见创建RAM用户

  • 请不要将AccessKey ID和AccessKey Secret保存到工程代码里,否则可能导致AccessKey泄露,威胁您账号下所有资源的安全。

  • Linux和macOS系统配置方法

    1. 在IntelliJ IDEA中打开终端Terminal。

    2. 执行以下命令,配置环境变量。

      <access_key_id>需替换为您RAM用户的AccessKey ID,<access_key_secret>替换为您RAM用户的AccessKey Secret。如果后续需要进行更多权限相关的配置,具体操作请参见使用RAM Policy控制访问权限

      export ALIBABA_CLOUD_ACCESS_KEY_ID=<access_key_id> 
      export ALIBABA_CLOUD_ACCESS_KEY_SECRET=<access_key_secret>
  • Windows系统配置方法

    新建环境变量文件,添加环境变量ALIBABA_CLOUD_ACCESS_KEY_IDALIBABA_CLOUD_ACCESS_KEY_SECRET,并写入已准备好的AccessKey ID和AccessKey Secret。然后重启Windows系统。本操作以Windows 10为例进行说明。

    1. 打开文件资源管理器,在此电脑上右键单击属性。

    2. 在右侧导航栏,单击高级系统配置

    3. 系统属性对话框的高级页签下,单击环境变量

    4. 环境变量对话框中,单击新建(W)image.png

    5. 在弹出的新建系统变量对话框中,添加环境变量ALIBABA_CLOUD_ACCESS_KEY_IDALIBABA_CLOUD_ACCESS_KEY_SECRET,并写入已准备好的AccessKey ID和AccessKey Secret。

    6. 重启Windows系统,使配置生效。

示例代码

文件在上海地域OSS

/*
引入依赖包
<!-- https://mvnrepository.com/artifact/com.aliyun/ocr20191230 -->
<dependency>
  	<groupId>com.aliyun</groupId>
  	<artifactId>ocr20191230</artifactId>
  	<version>${aliyun.ocr.version}</version>
</dependency>
*/

import com.aliyun.ocr20191230.models.RecognizePdfResponse;
import com.aliyun.tea.TeaModel;

public class RecognizePdf {
    public static com.aliyun.ocr20191230.Client createClient(String accessKeyId, String accessKeySecret) throws Exception {
        /*
          初始化配置对象com.aliyun.teaopenapi.models.Config
          Config对象存放 AccessKeyId、AccessKeySecret、endpoint等配置
         */
         com.aliyun.teaopenapi.models.Config config = new com.aliyun.teaopenapi.models.Config()
                .setAccessKeyId(accessKeyId)
                .setAccessKeySecret(accessKeySecret);
        // 访问的域名
        config.endpoint = "ocr.cn-shanghai.aliyuncs.com";
        return new com.aliyun.ocr20191230.Client(config);
    }

    public static void main(String[] args_) throws Exception {
        // 创建AccessKey ID和AccessKey Secret,请参考https://help.aliyun.com/document_detail/175144.html
        // 如果您使用的是RAM用户的AccessKey,还需要为子账号授予权限AliyunVIAPIFullAccess,请参考https://help.aliyun.com/document_detail/145025.html
        // 从环境变量读取配置的AccessKey ID和AccessKey Secret。运行代码示例前必须先配置环境变量。
        String accessKeyId = System.getenv("ALIBABA_CLOUD_ACCESS_KEY_ID");
        String accessKeySecret = System.getenv("ALIBABA_CLOUD_ACCESS_KEY_SECRET"); 
        com.aliyun.ocr20191230.Client client = RecognizePdf.createClient(accessKeyId, accessKeySecret);
        com.aliyun.ocr20191230.models.RecognizePdfRequest recognizePdfRequest = new com.aliyun.ocr20191230.models.RecognizePdfRequest()
                .setFileURL("https://viapi-test.oss-cn-shanghai.aliyuncs.com/viapi-3.0domepic/ocr/RecognizePdf/RecognizePdf1.pdf");
        com.aliyun.teautil.models.RuntimeOptions runtime = new com.aliyun.teautil.models.RuntimeOptions();
        try {
            RecognizePdfResponse recognizePdfResponse = client.recognizePdfWithOptions(recognizePdfRequest, runtime);
            // 获取整体结果
            System.out.println(com.aliyun.teautil.Common.toJSONString(TeaModel.buildMap(recognizePdfResponse)));
            // 获取单个字段
            System.out.println(recognizePdfResponse.getBody());
        } catch (com.aliyun.tea.TeaException teaException) {
            // 获取整体报错信息
            System.out.println(com.aliyun.teautil.Common.toJSONString(teaException));
            // 获取单个字段
            System.out.println(teaException.getCode());
        }
    }
}
# -*- coding: utf-8 -*-
# 引入依赖包
# pip install alibabacloud_ocr20191230

import os
from alibabacloud_ocr20191230.client import Client
from alibabacloud_ocr20191230.models import RecognizePdfRequest
from alibabacloud_tea_openapi.models import Config
from alibabacloud_tea_util.models import RuntimeOptions

config = Config(
    # 创建AccessKey ID和AccessKey Secret,请参考https://help.aliyun.com/document_detail/175144.html。
    # 如果您用的是RAM用户的AccessKey,还需要为RAM用户授予权限AliyunVIAPIFullAccess,请参考https://help.aliyun.com/document_detail/145025.html。
    # 从环境变量读取配置的AccessKey ID和AccessKey Secret。运行代码示例前必须先配置环境变量。
    access_key_id=os.environ.get('ALIBABA_CLOUD_ACCESS_KEY_ID'),
    access_key_secret=os.environ.get('ALIBABA_CLOUD_ACCESS_KEY_SECRET'),
    # 访问的域名
    endpoint='ocr.cn-shanghai.aliyuncs.com',
    # 访问的域名对应的region
    region_id='cn-shanghai'
)
recognize_pdf_request = RecognizePdfRequest(
    file_url='https://viapi-test.oss-cn-shanghai.aliyuncs.com/viapi-3.0domepic/ocr/RecognizePdf/RecognizePdf1.pdf'
)
runtime = RuntimeOptions()
try:
  # 初始化Client
  client = Client(config)
  response = client.recognize_pdf_with_options(recognize_pdf_request, runtime)
  # 获取整体结果
  print(response.body)
except Exception as error:
  # 获取整体报错信息
  print(error)
  # 获取单个字段
  print(error.code)
  # tips: 可通过error.__dict__查看属性名称
<?php

//安装依赖包
//composer require alibabacloud/ocr-20191230

use AlibabaCloud\SDK\Ocr\V20191230\Ocr;
use \Exception;
use AlibabaCloud\Tea\Utils\Utils;
use Darabonba\OpenApi\Models\Config;
use AlibabaCloud\SDK\Ocr\V20191230\Models\RecognizePdfRequest;
use AlibabaCloud\Tea\Utils\Utils\RuntimeOptions;

class RecognizePdf {

    /**
     * 使用AK&SK初始化账号Client
     * @param string $accessKeyId
     * @param string $accessKeySecret
     * @return Ocr Client
     */
    public static function createClient($accessKeyId, $accessKeySecret){
        //初始化配置对象Darabonba\OpenApi\Models\Config。
        //Config对象存放accessKeyId、accessKeySecret、endpoint等配置
        $config = new Config([
            "accessKeyId" => $accessKeyId,
            "accessKeySecret" => $accessKeySecret
        ]);
        // 访问的域名
        $config->endpoint = "ocr.cn-shanghai.aliyuncs.com";
        return new Ocr($config);
    }

    /**
     * @param string[] $args
     * @return void
     */
    public static function main($args){
        // 创建AccessKey ID和AccessKey Secret,请参考https://help.aliyun.com/document_detail/175144.html。
        // 如果您用的是RAM用户的AccessKey,还需要为RAM用户授予权限AliyunVIAPIFullAccess,请参考https://help.aliyun.com/document_detail/145025.html。
        // 从环境变量读取配置的AccessKey ID和AccessKey Secret。运行示例前必须先配置环境变量。    
        $accessKeyId = getenv('ALIBABA_CLOUD_ACCESS_KEY_ID');      
        $accessKeySecret = getenv('ALIBABA_CLOUD_ACCESS_KEY_SECRET');
        $client = self::createClient($accessKeyId, $accessKeySecret);
        $recognizePdfRequest = new RecognizePdfRequest([
            "fileURL" => "https://viapi-test.oss-cn-shanghai.aliyuncs.com/viapi-3.0domepic/ocr/RecognizePdf/RecognizePdf1.pdf"
        ]);
        $runtime = new RuntimeOptions([]);
        try {
            $resp = $client->recognizePdfWithOptions($recognizePdfRequest, $runtime);
            # 获取整体结果
            echo Utils::toJSONString($resp->body);
        } catch (Exception $exception) {
            # 获取整体报错信息
            echo Utils::toJSONString($exception);
            # 获取单个字段
            echo $exception->getCode();
        }
    }
}
$path = __DIR__ . \DIRECTORY_SEPARATOR . '..' . \DIRECTORY_SEPARATOR . 'vendor' . \DIRECTORY_SEPARATOR . 'autoload.php';
if (file_exists($path)) {
    require_once $path;
}
//$argv是预留的数组入参参数,无实际意义,无需进行修改
RecognizePdf::main(array_slice($argv, 1));
// 安装依赖包
// npm install @alicloud/ocr20191230
const OcrClient = require('@alicloud/ocr20191230');
const OpenapiClient = require('@alicloud/openapi-client');
const TeaUtil = require('@alicloud/tea-util');

let config = new OpenapiClient.Config({
    // 创建AccessKey ID和AccessKey Secret,请参考https://help.aliyun.com/document_detail/175144.html。
    // 如果您用的是RAM用户AccessKey,还需要为RAM用户授予权限AliyunVIAPIFullAccess,请参考https://help.aliyun.com/document_detail/145025.html。
    // 从环境变量读取配置的AccessKey ID和AccessKey Secret。运行示例前必须先配置环境变量。 
    accessKeyId: process.env.ALIBABA_CLOUD_ACCESS_KEY_ID,   
    accessKeySecret: process.env.ALIBABA_CLOUD_ACCESS_KEY_SECRET
});
// 访问的域名
config.endpoint = `ocr.cn-shanghai.aliyuncs.com`;
const client = new OcrClient.default(config);
let recognizePdfRequest = new OcrClient.RecognizePdfRequest({
  fileURL: "https://viapi-test.oss-cn-shanghai.aliyuncs.com/viapi-3.0domepic/ocr/RecognizePdf/RecognizePdf1.pdf",
});
let runtime = new TeaUtil.RuntimeOptions({ });
client.recognizePdfWithOptions(recognizePdfRequest, runtime)
  .then(function(recognizePdfResponse) {
    // 获取整体结果
    console.log(recognizePdfResponse);
    // 获取单个字段
    console.log(recognizePdfResponse.body.data);
  }, function(error) {
    // 获取整体报错信息
    console.log(error);
    // 获取单个字段
    console.log(error.data.Code);
  })
/**
依赖github.com/alibabacloud-go/ocr-20191230/v3
建议使用go mod tidy安装依赖
 */

import (
	"fmt"
	openapi "github.com/alibabacloud-go/darabonba-openapi/v2/client"
	ocr20191230 "github.com/alibabacloud-go/ocr-20191230/v3/client"
	util "github.com/alibabacloud-go/tea-utils/v2/service"
	"github.com/alibabacloud-go/tea/tea"
)

func main() {
     // 创建AccessKey ID和AccessKey Secret,请参考https://help.aliyun.com/document_detail/175144.html。
     // 如果您用的是RAM用户的AccessKey,还需要为RAM用户授予权限AliyunVIAPIFullAccess,请参考https://help.aliyun.com/document_detail/145025.html。
     // 从环境变量读取配置的AccessKey ID和AccessKey Secret。运行示例前必须先配置环境变量。  
     accessKeyId := os.Getenv("ALIBABA_CLOUD_ACCESS_KEY_ID")  
     accessKeySecret := os.Getenv("ALIBABA_CLOUD_ACCESS_KEY_SECRET")
     // 初始化配置对象 &openapi.Config。Config对象存放AccessKeyId、AccessKeySecret、Endpoint等配置。
	   config := &openapi.Config{
		      AccessKeyId: tea.String(accessKeyId),
		      AccessKeySecret: tea.String(accessKeySecret)
	   }
	// 访问的域名
	config.Endpoint = tea.String("ocr.cn-shanghai.aliyuncs.com")
	client, err := ocr20191230.NewClient(config)
	if err != nil {
		panic(err)
	}
	recognizePdfRequest := &ocr20191230.RecognizePdfRequest{
		FileURL: tea.String("https://viapi-test.oss-cn-shanghai.aliyuncs.com/viapi-3.0domepic/ocr/RecognizePdf/RecognizePdf1.pdf"),
	}
	runtime := &util.RuntimeOptions{}
	recognizePdfResponse, err := client.RecognizePdfWithOptions(recognizePdfRequest, runtime)
	if err != nil {
		// 获取整体报错信息
		fmt.Println(err.Error())
	} else {
		// 获取整体结果
		fmt.Println(recognizePdfResponse)
	}
}
// 安装依赖包
// dotnet add package AlibabaCloud.SDK.Ocr20191230
using System;
using System.Collections;
using System.Collections.Generic;
using System.IO;
using System.Net;
using System.Threading.Tasks;
using AlibabaCloud.SDK.Ocr20191230.Models;
using Tea;
using Tea.Utils;

namespace AlibabaCloud.SDK.Sample
{
    public class Sample
    {
        /**
            * 使用AK&SK初始化账号Client
            * @param accessKeyId
            * @param accessKeySecret
            * @return Client
            * @throws Exception
        */
        public static AlibabaCloud.SDK.Ocr20191230.Client CreateClient(string accessKeyId, string accessKeySecret)
        {
            AlibabaCloud.OpenApiClient.Models.Config config = new AlibabaCloud.OpenApiClient.Models.Config
            {
                AccessKeyId = accessKeyId,
                AccessKeySecret = accessKeySecret,
            };
            // 访问的域名
            config.Endpoint = "ocr.cn-shanghai.aliyuncs.com";
            return new AlibabaCloud.SDK.Ocr20191230.Client(config);
        }
        public static void Main(string[] args)
        {
            // 创建AccessKey ID和AccessKey Secret,请参考https://help.aliyun.com/document_detail/175144.html
            // 如果您使用的是RAM用户的AccessKey,还需要为子账号授予权限AliyunVIAPIFullAccess,请参考https://help.aliyun.com/document_detail/145025.html
            // 从环境变量读取配置的AccessKey ID和AccessKey Secret。运行代码示例前必须先配置环境变量。
            AlibabaCloud.SDK.Ocr20191230.Client client = CreateClient(System.Environment.GetEnvironmentVariable("ALIBABA_CLOUD_ACCESS_KEY_ID"), System.Environment.GetEnvironmentVariable("ALIBABA_CLOUD_ACCESS_KEY_SECRET"));
            AlibabaCloud.SDK.Ocr20191230.Models.RecognizePdfRequest recognizePdfRequest = new AlibabaCloud.SDK.Ocr20191230.Models.RecognizePdfRequest
            {
                FileURL = "https://viapi-test.oss-cn-shanghai.aliyuncs.com/viapi-3.0domepic/ocr/RecognizePdf/RecognizePdf1.pdf",
            };
            AlibabaCloud.TeaUtil.Models.RuntimeOptions runtime = new AlibabaCloud.TeaUtil.Models.RuntimeOptions();
            try
            {
                AlibabaCloud.SDK.Ocr20191230.Models.RecognizePdfResponse recognizePdfResponse = client.RecognizePdfWithOptions(recognizePdfRequest, runtime);
                // 获取整体结果
                Console.WriteLine(AlibabaCloud.TeaUtil.Common.ToJSONString(recognizePdfResponse.Body));
                // 获取单个字段
                Console.WriteLine(AlibabaCloud.TeaUtil.Common.ToJSONString(recognizePdfResponse.Body.Data));
            }
            catch (TeaException error)
            {
                // 如有需要,请打印 error
                Console.WriteLine(AlibabaCloud.TeaUtil.Common.AssertAsString(error.Message));
            }
            catch (Exception _error)
            {
                TeaException error = new TeaException(new Dictionary<string, object>
              {
                { "message", _error.Message }
              });
                // 如有需要,请打印 error
                Console.WriteLine(AlibabaCloud.TeaUtil.Common.AssertAsString(error.Message));
            }
        }
    }
}

文件在本地或可访问的URL

/*
引入依赖包
<!-- https://mvnrepository.com/artifact/com.aliyun/ocr20191230 -->
<dependency>
  	<groupId>com.aliyun</groupId>
  	<artifactId>ocr20191230</artifactId>
  	<version>${aliyun.ocr.version}</version>
</dependency>
*/

import com.aliyun.ocr20191230.models.RecognizePdfResponse;
import com.aliyun.tea.TeaModel;

import java.io.InputStream;
import java.net.URL;

public class RecognizePdf {
    public static com.aliyun.ocr20191230.Client createClient(String accessKeyId, String accessKeySecret) throws Exception {
        /*
          初始化配置对象com.aliyun.teaopenapi.models.Config
          Config对象存放 AccessKeyId、AccessKeySecret、endpoint等配置
         */
         com.aliyun.teaopenapi.models.Config config = new com.aliyun.teaopenapi.models.Config()
                .setAccessKeyId(accessKeyId)
                .setAccessKeySecret(accessKeySecret);
        // 访问的域名
        config.endpoint = "ocr.cn-shanghai.aliyuncs.com";
        return new com.aliyun.ocr20191230.Client(config);
    }

    public static void main(String[] args_) throws Exception {
        // 创建AccessKey ID和AccessKey Secret,请参考https://help.aliyun.com/document_detail/175144.html
        // 如果您使用的是RAM用户的AccessKey,还需要为子账号授予权限AliyunVIAPIFullAccess,请参考https://help.aliyun.com/document_detail/145025.html
        // 从环境变量读取配置的AccessKey ID和AccessKey Secret。运行代码示例前必须先配置环境变量。
        String accessKeyId = System.getenv("ALIBABA_CLOUD_ACCESS_KEY_ID");
        String accessKeySecret = System.getenv("ALIBABA_CLOUD_ACCESS_KEY_SECRET"); 
        com.aliyun.ocr20191230.Client client = RecognizePdf.createClient(accessKeyId, accessKeySecret);
        // 场景一,使用本地文件
        // InputStream inputStream = new FileInputStream(new File("/tmp/recognizePdf1.pdf"));
        // 场景二,使用任意可访问的url
        URL url = new URL("https://viapi-test-bj.oss-cn-beijing.aliyuncs.com/viapi-3.0domepic/ocr/RecognizePdf/RecognizePdf1.pdf");
        InputStream inputStream = url.openConnection().getInputStream();
        com.aliyun.ocr20191230.models.RecognizePdfAdvanceRequest recognizePdfAdvanceRequest = new com.aliyun.ocr20191230.models.RecognizePdfAdvanceRequest()
                .setFileURLObject(inputStream);
        com.aliyun.teautil.models.RuntimeOptions runtime = new com.aliyun.teautil.models.RuntimeOptions();
        try {
            RecognizePdfResponse recognizePdfResponse = client.recognizePdfAdvance(recognizePdfAdvanceRequest, runtime);
            // 获取整体结果
            System.out.println(com.aliyun.teautil.Common.toJSONString(TeaModel.buildMap(recognizePdfResponse)));
            // 获取单个字段
            System.out.println(recognizePdfResponse.getBody());
        } catch (com.aliyun.tea.TeaException teaException) {
            // 获取整体报错信息
            System.out.println(com.aliyun.teautil.Common.toJSONString(teaException));
            // 获取单个字段
            System.out.println(teaException.getCode());
        }
    }
}
# -*- coding: utf-8 -*-
# 引入依赖包
# pip install alibabacloud_ocr20191230

import os
import io
from urllib.request import urlopen
from alibabacloud_ocr20191230.client import Client
from alibabacloud_ocr20191230.models import RecognizePdfAdvanceRequest
from alibabacloud_tea_openapi.models import Config
from alibabacloud_tea_util.models import RuntimeOptions

config = Config(
    # 创建AccessKey ID和AccessKey Secret,请参考https://help.aliyun.com/document_detail/175144.html。
    # 如果您用的是RAM用户的AccessKey,还需要为RAM用户授予权限AliyunVIAPIFullAccess,请参考https://help.aliyun.com/document_detail/145025.html。
    # 从环境变量读取配置的AccessKey ID和AccessKey Secret。运行代码示例前必须先配置环境变量。
    access_key_id=os.environ.get('ALIBABA_CLOUD_ACCESS_KEY_ID'),
    access_key_secret=os.environ.get('ALIBABA_CLOUD_ACCESS_KEY_SECRET'),
    # 访问的域名
    endpoint='ocr.cn-shanghai.aliyuncs.com',
    # 访问的域名对应的region
    region_id='cn-shanghai'
)
#场景一:文件在本地
#stream = open(r'/tmp/RecognizePdf1.pdf', 'rb')
#recognize_pdf_request = RecognizePdfAdvanceRequest()
#recognize_pdf_request.file_urlobject = stream

#场景二:使用任意可访问的url
url = 'https://viapi-test-bj.oss-cn-beijing.aliyuncs.com/viapi-3.0domepic/ocr/RecognizePdf/RecognizePdf1.pdf'
img = urlopen(url).read()
recognize_pdf_request = RecognizePdfAdvanceRequest()
recognize_pdf_request.file_urlobject = io.BytesIO(img)
runtime = RuntimeOptions()
try:
  # 初始化Client
  client = Client(config)
  response = client.recognize_pdf_advance(recognize_pdf_request, runtime)
  # 获取整体结果
  print(response.body)
except Exception as error:
  # 获取整体报错信息
  print(error)
  # 获取单个字段
  print(error.code)
  # tips: 可通过error.__dict__查看属性名称

#关闭流
#stream.close()
<?php

//安装依赖包
//composer require alibabacloud/ocr-20191230

use AlibabaCloud\SDK\Ocr\V20191230\Ocr;
use AlibabaCloud\Tea\Utils\Utils;
use \Exception;
use Darabonba\OpenApi\Models\Config;
use AlibabaCloud\SDK\Ocr\V20191230\Models\RecognizePdfAdvanceRequest;
use AlibabaCloud\Tea\Utils\Utils\RuntimeOptions;
use GuzzleHttp\Psr7\Stream;

class RecognizePdfAdvance {

    /**
     * 使用AK&SK初始化账号Client
     * @param string $accessKeyId
     * @param string $accessKeySecret
     * @return Ocr Client
     */
    public static function createClient($accessKeyId, $accessKeySecret){
        //初始化配置对象Darabonba\OpenApi\Models\Config。
        //Config对象存放accessKeyId、accessKeySecret、endpoint等配置
        $config = new Config([
            "accessKeyId" => $accessKeyId,
            "accessKeySecret" => $accessKeySecret
        ]);
        // 访问的域名
        $config->endpoint = "ocr.cn-shanghai.aliyuncs.com";
        return new Ocr($config);
    }

    /**
     * @param string[] $args
     * @return void
     */
    public static function main($args){
        // 创建AccessKey ID和AccessKey Secret,请参考https://help.aliyun.com/document_detail/175144.html。
        // 如果您用的是RAM用户的AccessKey,还需要为RAM用户授予权限AliyunVIAPIFullAccess,请参考https://help.aliyun.com/document_detail/145025.html。
        // 从环境变量读取配置的AccessKey ID和AccessKey Secret。运行示例前必须先配置环境变量。    
        $accessKeyId = getenv('ALIBABA_CLOUD_ACCESS_KEY_ID');      
        $accessKeySecret = getenv('ALIBABA_CLOUD_ACCESS_KEY_SECRET');
        $client = self::createClient($accessKeyId, $accessKeySecret);
        // 场景一,使用本地文件
        //$file = fopen('/tmp/RecognizePdf1.pdf', 'rb');
        //$stream = new Stream($file);
        // 场景二,使用任意可访问的url
        $file = fopen('https://viapi-test-bj.oss-cn-beijing.aliyuncs.com/viapi-3.0domepic/ocr/RecognizePdf/RecognizePdf1.pdf', 'rb');
        $stream = new Stream($file);
        $recognizePdfAdvanceRequest = new RecognizePdfAdvanceRequest([
            "fileURLObject" => $stream
        ]);
        $runtime = new RuntimeOptions([]);
        // 复制代码运行请自行打印 API 的返回值
       try {
            $resp = $client->recognizePdfAdvance($recognizePdfAdvanceRequest, $runtime);
            # 获取整体结果
            echo Utils::toJSONString($resp->body);
        } catch (Exception $exception) {
            # 获取整体报错信息
            echo Utils::toJSONString($exception);
            # 获取单个字段
            echo $exception->getCode();
        }
    }
}
$path = __DIR__ . \DIRECTORY_SEPARATOR . '..' . \DIRECTORY_SEPARATOR . 'vendor' . \DIRECTORY_SEPARATOR . 'autoload.php';
if (file_exists($path)) {
    require_once $path;
}
//$argv是预留的数组入参参数,无实际意义,无需进行修改
RecognizePdfAdvance::main(array_slice($argv, 1));
// 安装依赖包
// npm install @alicloud/ocr20191230
const OcrClient = require('@alicloud/ocr20191230');
const OpenapiClient = require('@alicloud/openapi-client');
const TeaUtil = require('@alicloud/tea-util');
const fs = require('fs');
const http = require('http');
const https = require('https');

let config = new OpenapiClient.Config({
    // 创建AccessKey ID和AccessKey Secret,请参考https://help.aliyun.com/document_detail/175144.html。
    // 如果您用的是RAM用户AccessKey,还需要为RAM用户授予权限AliyunVIAPIFullAccess,请参考https://help.aliyun.com/document_detail/145025.html。
    // 从环境变量读取配置的AccessKey ID和AccessKey Secret。运行示例前必须先配置环境变量。 
    accessKeyId: process.env.ALIBABA_CLOUD_ACCESS_KEY_ID,   
    accessKeySecret: process.env.ALIBABA_CLOUD_ACCESS_KEY_SECRET
});
// 访问的域名
config.endpoint = `ocr.cn-shanghai.aliyuncs.com`;
const client = new OcrClient.default(config);
const getResponse = function (httpClient, url) {
  return new Promise((resolve, reject) => {
    httpClient.get(url, function (response) {
      resolve(response);
    })
  })
}
const request = async function () {
  try {
    let recognizePdfAdvanceRequest = new OcrClient.RecognizePdfAdvanceRequest();
    // 场景一,使用本地文件
    // const fileStream = fs.createReadStream('/tmp/RecognizePdf1.pdf');
    // recognizePdfAdvanceRequest.fileURLObject = fileStream;
    // 场景二,使用任意可访问的url
    const url = new URL("https://viapi-test-bj.oss-cn-beijing.aliyuncs.com/viapi-3.0domepic/ocr/RecognizePdf/RecognizePdf1.pdf");
    const httpClient = (url.protocol == "https:") ? https : http;
    recognizePdfAdvanceRequest.fileURLObject = await getResponse(httpClient, url);
    let runtime = new TeaUtil.RuntimeOptions({});
    client.recognizePdfAdvance(recognizePdfAdvanceRequest, runtime)
      .then(function (recognizePdfResponse) {
        // 获取整体结果
        console.log(recognizePdfResponse);
        // 获取单个字段
        console.log(recognizePdfResponse.body.data);
      }, function (error) {
        // 获取整体报错信息
        console.log(error);
        // 获取单个字段
        console.log(error.data.Code);
      })
  } catch (error) {
    console.log(error);
  }
}();
/**
依赖github.com/alibabacloud-go/ocr-20191230/v3
建议使用go mod tidy安装依赖
 */

import (
	"fmt"
	openapi "github.com/alibabacloud-go/darabonba-openapi/v2/client"
	ocr20191230 "github.com/alibabacloud-go/ocr-20191230/v3/client"
	util "github.com/alibabacloud-go/tea-utils/v2/service"
	"github.com/alibabacloud-go/tea/tea"
	"net/http"
)

func main() {  
     // 创建AccessKey ID和AccessKey Secret,请参考https://help.aliyun.com/document_detail/175144.html。
     // 如果您用的是RAM用户的AccessKey,还需要为RAM用户授予权限AliyunVIAPIFullAccess,请参考https://help.aliyun.com/document_detail/145025.html。
     // 从环境变量读取配置的AccessKey ID和AccessKey Secret。运行示例前必须先配置环境变量。  
     accessKeyId := os.Getenv("ALIBABA_CLOUD_ACCESS_KEY_ID")  
     accessKeySecret := os.Getenv("ALIBABA_CLOUD_ACCESS_KEY_SECRET")
     // 初始化配置对象 &openapi.Config。Config对象存放AccessKeyId、AccessKeySecret、Endpoint等配置。
	   config := &openapi.Config{
		      AccessKeyId: tea.String(accessKeyId),
		      AccessKeySecret: tea.String(accessKeySecret)
	   }
	// 访问的域名
	config.Endpoint = tea.String("ocr.cn-shanghai.aliyuncs.com")
	client, err := ocr20191230.NewClient(config)
	if err != nil {
		panic(err)
	}
	// 场景一,使用本地文件
	//file, err := os.Open("/tmp/RecognizePdf1.pdf")
	//if err != nil {
	//	fmt.Println("can not open file", err)
	//	panic(err)
	//}
	//recognizePdfAdvanceRequest := &ocr20191230.RecognizePdfAdvanceRequest{
	//	FileURLObject: file,
	//}
	//场景二,使用任意可访问的url
	httpClient := http.Client{}
	file, _ := httpClient.Get("https://viapi-test-bj.oss-cn-beijing.aliyuncs.com/viapi-3.0domepic/ocr/RecognizePdf/RecognizePdf1.pdf")
	recognizePdfAdvanceRequest := &ocr20191230.RecognizePdfAdvanceRequest{
		FileURLObject: file.Body,
	}
	runtime := &util.RuntimeOptions{}
	recognizePdfAdvanceResponse, err := client.RecognizePdfAdvance(recognizePdfAdvanceRequest, runtime)
	if err != nil {
		// 获取整体报错信息
		fmt.Println(err.Error())
	} else {
		// 获取整体结果
		fmt.Println(recognizePdfAdvanceResponse)
	}
}
// 安装依赖包
// dotnet add package AlibabaCloud.SDK.Ocr20191230
using System;
using System.Collections;
using System.Collections.Generic;
using System.IO;
using System.Net;
using System.Threading.Tasks;
using AlibabaCloud.SDK.Ocr20191230.Models;
using Tea;
using Tea.Utils;
using static System.Net.WebRequestMethods;

namespace AlibabaCloud.SDK.Sample
{
public class Sample
    {

        /**
* 使用AK&SK初始化账号Client
* @param accessKeyId
* @param accessKeySecret
* @return Client
* @throws Exception
*/
        public static AlibabaCloud.SDK.Ocr20191230.Client CreateClient(string accessKeyId, string accessKeySecret)
        {
            AlibabaCloud.OpenApiClient.Models.Config config = new AlibabaCloud.OpenApiClient.Models.Config
            {
                AccessKeyId = AccessKeyId,
                AccessKeySecret = AccessKeySecret,
            };
            // 访问的域名
            config.Endpoint = "ocr.cn-shanghai.aliyuncs.com";
            return new AlibabaCloud.SDK.Ocr20191230.Client(config);
        }
        public static void Main(string[] args)
        {
            // 创建AccessKey ID和AccessKey Secret,请参考https://help.aliyun.com/document_detail/175144.html
            // 如果您使用的是RAM用户的AccessKey,还需要为子账号授予权限AliyunVIAPIFullAccess,请参考https://help.aliyun.com/document_detail/145025.html
            // 从环境变量读取配置的AccessKey ID和AccessKey Secret。运行代码示例前必须先配置环境变量。
            AlibabaCloud.SDK.Ocr20191230.Client client = CreateClient(System.Environment.GetEnvironmentVariable("ALIBABA_CLOUD_ACCESS_KEY_ID"), System.Environment.GetEnvironmentVariable("ALIBABA_CLOUD_ACCESS_KEY_SECRET"));
            AlibabaCloud.SDK.Ocr20191230.Models.RecognizePdfAdvanceRequest recognizePdfAdvanceRequest = new AlibabaCloud.SDK.Ocr20191230.Models.RecognizePdfAdvanceRequest
            ();
            /* 场景一,使用本地文件
            System.IO.StreamReader file = new System.IO.StreamReader(@"/tmp/RecognizePdf1.pdf");
            recognizePdfAdvanceRequest.FileURLObject = file.BaseStream;
            */
            // 场景二,使用任意可访问的url
            HttpWebRequest request = (HttpWebRequest)WebRequest.Create("https://viapi-test-bj.oss-cn-beijing.aliyuncs.com/viapi-3.0domepic/ocr/RecognizePdf/RecognizePdf1.pdf");
            WebResponse response = request.GetResponse();
            Stream stream = response.GetResponseStream();
            recognizePdfAdvanceRequest.FileURLObject = stream;
            AlibabaCloud.TeaUtil.Models.RuntimeOptions runtime = new AlibabaCloud.TeaUtil.Models.RuntimeOptions();
            try
            {
                AlibabaCloud.SDK.Ocr20191230.Models.RecognizePdfResponse recognizePdfResponse = client.RecognizePdfAdvance(recognizePdfAdvanceRequest, runtime);
                // 获取整体结果
                Console.WriteLine(AlibabaCloud.TeaUtil.Common.ToJSONString(recognizePdfResponse.Body));
                // 获取单个字段
                Console.WriteLine(AlibabaCloud.TeaUtil.Common.ToJSONString(recognizePdfResponse.Body.Data));
            }
            catch (TeaException error)
            {
                // 如有需要,请打印 error
                AlibabaCloud.TeaUtil.Common.AssertAsString(error.Message);
            }
            catch (Exception _error)
            {
                TeaException error = new TeaException(new Dictionary<string, object>
                {
                    { "message", _error.Message }
                });
                // 如有需要,请打印 error
                Console.WriteLine(error.Message);
            }
        }
    }
}