Skip to content

PDF转为文档

将PDF转换为文档格式。测试应用仅开放转换前三页。

注意

PDF 转换为文档时,支持的最大文档大小为 100 MB;超出该大小的文件建议先拆分后再处理。

目前支持转换为的文档类型:

| 文档类型 | 扩展名 |
| --- | --- |
| 文字 | docx |
| 表格 | xlsx |
| 演示 | pptx |
| 表格提取 | table |
| JSON | json |

基本信息

请求路径:POST /api/developer/v1/office/pdf/convert/to/:office_type

参数 | 必须 | 类型 | 说明
Date
string
使用 RFC1123 时间格式的当前时间
Content-Md5
string
HTTP Body 中数据的 MD5 值的十六进制表示,必须为小写;如果是 GET 请求,一律使用 URI 计算 MD5
Content-Type
string
目前固定为: application/json
Authorization
string
"WPS-2:" + app_id + ":" + sha1(app_key + Content-Md5 + Content-Type + Date)

Path 参数

参数 | 必须 | 类型 | 说明
office_type
string
转换为的文件类型:docx,xlsx,pptx,table,json

Body 参数

参数 | 必须 | 类型 | 说明
url
string
文档下载地址,可以是 PDF 文件或 ZIP 文件的 URL;文件类型根据后缀(.pdf 或 .zip)判断
page_num_begin
integer
转换的起始页,页码从 1 开始。例如 page_num_begin 为 1、page_num_end 为 3 时转换第 1~3 页;两者都为 0 时转换整个文档。
page_num_end
integer
转换的结束页
text_unify
boolean
统一段落字体字号,建议传true
sheet_option
integer
转换为表格时的配置项,指定 sheet 的转换方式:0 表示每页 PDF(每页图片)对应一个 sheet;1 表示所有页面(图片)转到同一个 sheet 中;默认为 0
export_type
string
表格提取时配置,输出类型:xlsx,html,默认为html

返回参数

参数 | 必须 | 类型 | 说明
code
integer
错误码
+
data
data {}
响应数据

示例

请求示例(示例中的 Content-Md5 与 Authorization 仅为占位值,实际调用时需按上文规则根据请求内容计算)

# Submit a PDF-to-docx conversion task; the JSON body carries the document URL.
curl -X POST \
	-H 'Authorization: WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a' \
	-H 'Content-Md5: d41d8cd98f00b204e9800998ecf8427e' \
	-H 'Content-Type: application/json' \
	-H 'Date: Wed, 23 Jan 2013 06:43:08 GMT' \
	-d '{"url":"https://***.com/***"}' \
	https://solution.wps.cn/api/developer/v1/office/pdf/convert/to/docx
OkHttpClient client = new OkHttpClient();

MediaType mediaType = MediaType.parse("application/json");
RequestBody body = RequestBody.create(mediaType, "{\"url\":\"https://***.com/***\"}");
Request request = new Request.Builder()
	.url("https://solution.wps.cn/api/developer/v1/office/pdf/convert/to/docx")
	.post(body)
	.addHeader("Date", "Wed, 23 Jan 2013 06:43:08 GMT")
	.addHeader("Content-Md5", "d41d8cd98f00b204e9800998ecf8427e")
	.addHeader("Content-Type", "application/json")
	.addHeader("Authorization", "WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a")
	.build();

Response response = client.newCall(request).execute();
package main

import (
	"fmt"
	"strings"
	"net/http"
	"io/ioutil"
)

// main sends the sample PDF-to-docx conversion request and prints the
// response object followed by the response body. Any failure while building
// the request, sending it, or reading the body is printed and ends the run.
func main() {

	url := "https://solution.wps.cn/api/developer/v1/office/pdf/convert/to/docx"

	payload := strings.NewReader("{\"url\":\"https://***.com/***\"}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		fmt.Println(err)
		return
	}

	req.Header.Add("Date", "Wed, 23 Jan 2013 06:43:08 GMT")
	req.Header.Add("Content-Md5", "d41d8cd98f00b204e9800998ecf8427e")
	req.Header.Add("Content-Type", "application/json")
	req.Header.Add("Authorization", "WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do fails, so it must not be touched (not even to
		// close its body) on this path.
		fmt.Println(err)
		return
	}
	defer res.Body.Close()

	body, err := ioutil.ReadAll(res.Body)
	if err != nil {
		fmt.Println(err)
		return
	}

	fmt.Println(res)
	fmt.Println(string(body))

}
import http.client

# Sample request: submit a PDF-to-docx conversion task with http.client.
conn = http.client.HTTPSConnection("solution.wps.cn")

payload = "{\"url\":\"https://***.com/***\"}"

headers = {
    'Date': "Wed, 23 Jan 2013 06:43:08 GMT",
    'Content-Md5': "d41d8cd98f00b204e9800998ecf8427e",
    'Content-Type': "application/json",
    'Authorization': "WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a"
    }

try:
    conn.request("POST", "/api/developer/v1/office/pdf/convert/to/docx", payload, headers)

    res = conn.getresponse()
    data = res.read()
finally:
    # Close the connection whether or not the request and the read succeeded.
    conn.close()

print(data.decode("utf-8"))
<?php

// Sample request: submit a PDF-to-docx conversion task with the cURL extension.
$options = [
	CURLOPT_URL => "https://solution.wps.cn/api/developer/v1/office/pdf/convert/to/docx",
	CURLOPT_RETURNTRANSFER => true,
	CURLOPT_ENCODING => "",
	CURLOPT_MAXREDIRS => 10,
	CURLOPT_TIMEOUT => 30,
	CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
	CURLOPT_CUSTOMREQUEST => "POST",
	CURLOPT_POSTFIELDS => "{\"url\":\"https://***.com/***\"}",
	CURLOPT_HTTPHEADER => [
		"Authorization: WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a",
		"Content-Md5: d41d8cd98f00b204e9800998ecf8427e",
		"Content-Type: application/json",
		"Date: Wed, 23 Jan 2013 06:43:08 GMT"
	],
];

$ch = curl_init();
curl_setopt_array($ch, $options);

// Capture both the result and the error text before the handle is closed.
$response = curl_exec($ch);
$err = curl_error($ch);

curl_close($ch);

// Print the cURL error when one was reported, otherwise the value curl_exec returned.
echo $err ? "cURL Error #:" . $err : $response;
// Sample browser request: submit a PDF-to-docx conversion task with XMLHttpRequest.
const endpoint = "https://solution.wps.cn/api/developer/v1/office/pdf/convert/to/docx";

// Headers are applied in this order after the request is opened.
// NOTE(review): browsers appear to treat "Date" as a forbidden request header,
// so setting it from page script may have no effect — confirm before relying on it.
const requestHeaders = [
	["Date", "Wed, 23 Jan 2013 06:43:08 GMT"],
	["Content-Md5", "d41d8cd98f00b204e9800998ecf8427e"],
	["Content-Type", "application/json"],
	["Authorization", "WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a"],
];

const data = JSON.stringify({ url: "https://***.com/***" });

const xhr = new XMLHttpRequest();
xhr.withCredentials = true;

// Log the response text once the request has reached the DONE state.
xhr.addEventListener("readystatechange", () => {
	if (xhr.readyState !== XMLHttpRequest.DONE) {
		return;
	}
	console.log(xhr.responseText);
});

xhr.open("POST", endpoint);
for (const [headerName, headerValue] of requestHeaders) {
	xhr.setRequestHeader(headerName, headerValue);
}

xhr.send(data);
// Sample Node.js request: submit a PDF-to-docx conversion task with the
// built-in https module and print the response body.
const https = require("https");

const options = {
	"method": "POST",
	"hostname": "solution.wps.cn",
	"port": null,
	"path": "/api/developer/v1/office/pdf/convert/to/docx",
	"headers": {
		"Date": "Wed, 23 Jan 2013 06:43:08 GMT",
		"Content-Md5": "d41d8cd98f00b204e9800998ecf8427e",
		"Content-Type": "application/json",
		"Authorization": "WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a"
	}
};

const req = https.request(options, (res) => {
	// Collect the body chunks and print them as one string when the response ends.
	const chunks = [];

	res.on("data", (chunk) => {
		chunks.push(chunk);
	});

	res.on("end", () => {
		const body = Buffer.concat(chunks);
		console.log(body.toString());
	});
});

// Without an "error" listener, a DNS or connection failure is emitted as an
// unhandled "error" event and terminates the process.
req.on("error", (err) => {
	console.error(err);
});

req.write(JSON.stringify({url: 'https://***.com/***'}));
req.end();
/* Sample request: submit a PDF-to-docx conversion task with libcurl. */
CURL *hnd = curl_easy_init();

curl_easy_setopt(hnd, CURLOPT_CUSTOMREQUEST, "POST");
curl_easy_setopt(hnd, CURLOPT_URL, "https://solution.wps.cn/api/developer/v1/office/pdf/convert/to/docx");

/* Build the request header list; it is handed to the handle below. */
struct curl_slist *headers = NULL;
headers = curl_slist_append(headers, "Date: Wed, 23 Jan 2013 06:43:08 GMT");
headers = curl_slist_append(headers, "Content-Md5: d41d8cd98f00b204e9800998ecf8427e");
headers = curl_slist_append(headers, "Content-Type: application/json");
headers = curl_slist_append(headers, "Authorization: WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a");
curl_easy_setopt(hnd, CURLOPT_HTTPHEADER, headers);

curl_easy_setopt(hnd, CURLOPT_POSTFIELDS, "{\"url\":\"https://***.com/***\"}");

CURLcode ret = curl_easy_perform(hnd);

/* Release the header list and the easy handle once the transfer has finished. */
curl_slist_free_all(headers);
curl_easy_cleanup(hnd);
// Sample request: submit a PDF-to-docx conversion task with RestSharp.
string endpoint = "https://solution.wps.cn/api/developer/v1/office/pdf/convert/to/docx";
string jsonBody = "{\"url\":\"https://***.com/***\"}";

var client = new RestClient(endpoint);
var request = new RestRequest(Method.POST);

// Request headers first, then the JSON payload attached as the request body.
request.AddHeader("Date", "Wed, 23 Jan 2013 06:43:08 GMT");
request.AddHeader("Content-Md5", "d41d8cd98f00b204e9800998ecf8427e");
request.AddHeader("Content-Type", "application/json");
request.AddHeader("Authorization", "WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a");
request.AddParameter("application/json", jsonBody, ParameterType.RequestBody);

IRestResponse response = client.Execute(request);

返回示例

json
{
    "code": 0,
    "data": {
        "task_id": "0f27ff302780428e9ddfd39189731891"
    }
}

查询异步任务结果

携带 task_id 查询结果

提示

task_id 的有效期为 1 小时。超过 1 小时后,本次转换结果的缓存将被自动删除,请及时保存相关转换结果及文件。

错误码

请参考错误码说明