主题
PDF转为文档
将PDF转换为文档格式。测试应用仅开放转换前三页。
注意
PDF转换为文档支持的最大文件大小为100MB,超出限制的大文件建议先拆分后再进行转换。
目前支持转换为的文档类型:
文档类型 | 扩展名 |
---|---|
文字 | docx |
表格 | xlsx |
演示 | pptx |
表格提取 | table |
JSON | json |
基本信息
请求路径:POST /api/developer/v1/office/pdf/convert/to/:office_type
Header 参数
参数 | 必须 | 类型 | 说明 |
---|---|---|---|
Date | 是 | string | 使用 RFC1123 时间格式的当前时间 |
Content-Md5 | 是 | string | HTTP Body 中数据的 MD5 值的十六进制表示,必须小写;如果是 GET 请求,一律使用 URI 计算 MD5 |
Content-Type | 是 | string | 目前固定为: application/json |
Authorization | 是 | string | "WPS-2:" + app_id + ":" + sha1( app_key + Content-Md5 + Content-Type + Date ) |
Path 参数
参数 | 必须 | 类型 | 说明 |
---|---|---|---|
office_type | 是 | string | 转换为的文件类型: docx ,xlsx ,pptx ,table ,json |
Body 参数
参数 | 必须 | 类型 | 说明 |
---|---|---|---|
url | 是 | string | 文档下载地址(PDF 或 ZIP 文件的 URL,根据后缀 .pdf 或 .zip 判断文件类型) |
page_num_begin | 否 | integer | 转换的起始页,页码从1开始。例如 page_num_begin=1、page_num_end=3 表示转换第1~3页;两者都为0时转换整个文档。 |
page_num_end | 否 | integer | 转换的结束页 |
text_unify | 否 | boolean | 统一段落字体字号,建议传true |
sheet_option | 否 | integer | 转换为表格 时配置:sheet转换方式 0表示每页pdf(每页图片)一个sheet, 1表示所有页面(图片)转到一个sheet中, 默认为0 |
export_type | 否 | string | 表格提取 时配置,输出类型:xlsx,html,默认为html |
返回参数
参数 | 必须 | 类型 | 说明 |
---|---|---|---|
code | 是 | integer | 错误码 |
data | 是 | data {} | 响应数据 |
示例
请求示例
# Submit a PDF-to-docx conversion task.
# The Date, Content-Md5 and Authorization values are samples; compute them for each request.
curl -X POST \
  -H 'Authorization: WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a' \
  -H 'Content-Md5: d41d8cd98f00b204e9800998ecf8427e' \
  -H 'Content-Type: application/json' \
  -H 'Date: Wed, 23 Jan 2013 06:43:08 GMT' \
  -d '{"url":"https://***.com/***"}' \
  'https://solution.wps.cn/api/developer/v1/office/pdf/convert/to/docx'
OkHttpClient client = new OkHttpClient();
MediaType mediaType = MediaType.parse("application/json");
RequestBody body = RequestBody.create(mediaType, "{\"url\":\"https://***.com/***\"}");
Request request = new Request.Builder()
.url("https://solution.wps.cn/api/developer/v1/office/pdf/convert/to/docx")
.post(body)
.addHeader("Date", "Wed, 23 Jan 2013 06:43:08 GMT")
.addHeader("Content-Md5", "d41d8cd98f00b204e9800998ecf8427e")
.addHeader("Content-Type", "application/json")
.addHeader("Authorization", "WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a")
.build();
Response response = client.newCall(request).execute();
package main

import (
	"fmt"
	"io/ioutil"
	"log"
	"net/http"
	"strings"
)

// main submits a PDF-to-docx conversion task and prints the response,
// exiting with a non-zero status if any step fails.
func main() {
	if err := run(); err != nil {
		log.Fatal(err)
	}
}

// run builds the request, sends it and prints the response and its body.
// The Date, Content-Md5 and Authorization values are samples; compute them
// for each request.
func run() error {
	url := "https://solution.wps.cn/api/developer/v1/office/pdf/convert/to/docx"
	payload := strings.NewReader("{\"url\":\"https://***.com/***\"}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		return fmt.Errorf("build request: %w", err)
	}
	req.Header.Add("Date", "Wed, 23 Jan 2013 06:43:08 GMT")
	req.Header.Add("Content-Md5", "d41d8cd98f00b204e9800998ecf8427e")
	req.Header.Add("Content-Type", "application/json")
	req.Header.Add("Authorization", "WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a")

	// res is nil when Do fails, so the error must be checked before the
	// deferred Close is registered.
	res, err := http.DefaultClient.Do(req)
	if err != nil {
		return fmt.Errorf("send request: %w", err)
	}
	defer res.Body.Close()

	body, err := ioutil.ReadAll(res.Body)
	if err != nil {
		return fmt.Errorf("read response body: %w", err)
	}

	fmt.Println(res)
	fmt.Println(string(body))
	return nil
}
import http.client

# Submit a PDF-to-docx conversion task and print the decoded reply.
# The Date, Content-Md5 and Authorization values are samples; compute them for each request.
request_headers = {
    "Date": "Wed, 23 Jan 2013 06:43:08 GMT",
    "Content-Md5": "d41d8cd98f00b204e9800998ecf8427e",
    "Content-Type": "application/json",
    "Authorization": "WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a",
}
request_body = '{"url":"https://***.com/***"}'

connection = http.client.HTTPSConnection("solution.wps.cn")
connection.request(
    "POST",
    "/api/developer/v1/office/pdf/convert/to/docx",
    body=request_body,
    headers=request_headers,
)

response = connection.getresponse()
print(response.read().decode("utf-8"))
<?php

// Submit a PDF-to-docx conversion task and echo the raw reply, or the cURL
// error text when the transfer fails.
// The Date, Content-Md5 and Authorization values are samples; compute them for each request.
$endpoint = "https://solution.wps.cn/api/developer/v1/office/pdf/convert/to/docx";
$payload = "{\"url\":\"https://***.com/***\"}";
$requestHeaders = [
    "Authorization: WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a",
    "Content-Md5: d41d8cd98f00b204e9800998ecf8427e",
    "Content-Type: application/json",
    "Date: Wed, 23 Jan 2013 06:43:08 GMT"
];

$handle = curl_init();
curl_setopt_array($handle, [
    CURLOPT_URL => $endpoint,
    CURLOPT_RETURNTRANSFER => true,
    CURLOPT_ENCODING => "",
    CURLOPT_MAXREDIRS => 10,
    CURLOPT_TIMEOUT => 30,
    CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
    CURLOPT_CUSTOMREQUEST => "POST",
    CURLOPT_POSTFIELDS => $payload,
    CURLOPT_HTTPHEADER => $requestHeaders,
]);

// Capture both the body and the error text before the handle is closed.
$reply = curl_exec($handle);
$failure = curl_error($handle);
curl_close($handle);

echo $failure ? ("cURL Error #:" . $failure) : $reply;
// Submit a PDF-to-docx conversion task from a browser and log the reply text.
// The Date, Content-Md5 and Authorization values are samples; compute them for each request.
// NOTE(review): browsers list `Date` among the forbidden request headers, so that
// setRequestHeader call may be ignored when this runs in a page — confirm in the target runtime.
const requestBody = JSON.stringify({ url: "https://***.com/***" });

const requestHeaders = {
  Date: "Wed, 23 Jan 2013 06:43:08 GMT",
  "Content-Md5": "d41d8cd98f00b204e9800998ecf8427e",
  "Content-Type": "application/json",
  Authorization: "WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a",
};

const request = new XMLHttpRequest();
request.withCredentials = true;

request.addEventListener("readystatechange", () => {
  if (request.readyState !== XMLHttpRequest.DONE) {
    return;
  }
  console.log(request.responseText);
});

request.open("POST", "https://solution.wps.cn/api/developer/v1/office/pdf/convert/to/docx");
for (const [headerName, headerValue] of Object.entries(requestHeaders)) {
  request.setRequestHeader(headerName, headerValue);
}

request.send(requestBody);
// Submit a PDF-to-docx conversion task from Node.js and log the reply body.
// The Date, Content-Md5 and Authorization values are samples; compute them for each request.
const https = require("https");

const payload = JSON.stringify({ url: "https://***.com/***" });

const options = {
  method: "POST",
  hostname: "solution.wps.cn",
  port: null,
  path: "/api/developer/v1/office/pdf/convert/to/docx",
  headers: {
    Date: "Wed, 23 Jan 2013 06:43:08 GMT",
    "Content-Md5": "d41d8cd98f00b204e9800998ecf8427e",
    "Content-Type": "application/json",
    Authorization: "WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a",
  },
};

const req = https.request(options, (res) => {
  // The body arrives in chunks; collect them and decode once the stream ends.
  const chunks = [];

  res.on("data", (chunk) => {
    chunks.push(chunk);
  });

  res.on("end", () => {
    const body = Buffer.concat(chunks);
    console.log(body.toString());
  });
});

// Without an 'error' listener, a DNS/TLS/connection failure is emitted as an
// unhandled 'error' event and terminates the process.
req.on("error", (err) => {
  console.error(`Request failed: ${err.message}`);
  process.exitCode = 1;
});

req.write(payload);
req.end();
/*
 * Submit a PDF-to-docx conversion task with libcurl.
 * The Date, Content-Md5 and Authorization values are samples; compute them
 * for each request.
 */
CURL *hnd = curl_easy_init();

curl_easy_setopt(hnd, CURLOPT_CUSTOMREQUEST, "POST");
curl_easy_setopt(hnd, CURLOPT_URL, "https://solution.wps.cn/api/developer/v1/office/pdf/convert/to/docx");

struct curl_slist *headers = NULL;
headers = curl_slist_append(headers, "Date: Wed, 23 Jan 2013 06:43:08 GMT");
headers = curl_slist_append(headers, "Content-Md5: d41d8cd98f00b204e9800998ecf8427e");
headers = curl_slist_append(headers, "Content-Type: application/json");
headers = curl_slist_append(headers, "Authorization: WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a");
curl_easy_setopt(hnd, CURLOPT_HTTPHEADER, headers);

curl_easy_setopt(hnd, CURLOPT_POSTFIELDS, "{\"url\":\"https://***.com/***\"}");

/* ret holds the transfer status; compare it with CURLE_OK before using the reply. */
CURLcode ret = curl_easy_perform(hnd);

/* The header list and the easy handle are owned by the caller: free both
 * once the transfer is finished so they do not leak. */
curl_slist_free_all(headers);
curl_easy_cleanup(hnd);
// Submit a PDF-to-docx conversion task with RestSharp.
// The Date, Content-Md5 and Authorization values are samples; compute them for each request.
var endpoint = "https://solution.wps.cn/api/developer/v1/office/pdf/convert/to/docx";
var jsonPayload = "{\"url\":\"https://***.com/***\"}";

var restClient = new RestClient(endpoint);

var restRequest = new RestRequest(Method.POST);
restRequest.AddHeader("Date", "Wed, 23 Jan 2013 06:43:08 GMT");
restRequest.AddHeader("Content-Md5", "d41d8cd98f00b204e9800998ecf8427e");
restRequest.AddHeader("Content-Type", "application/json");
restRequest.AddHeader("Authorization", "WPS-2:******:ac59dac1460772a04b3a97d7ef78409f28241e3a");
restRequest.AddParameter("application/json", jsonPayload, ParameterType.RequestBody);

IRestResponse response = restClient.Execute(restRequest);
返回示例
json
{
"code": 0,
"data": {
"task_id": "0f27ff302780428e9ddfd39189731891"
}
}
查询异步任务结果
携带 task_id 查询结果
提示
task_id 有效期为1个小时。超过1个小时后,本次转换结果缓存将被自动删除,请及时保存相关转换结果及文件。
错误码
请参考错误码说明