Create document

POST /v1alpha1/public/knowledge-base/document
curl --request POST \
  --url https://realtime-api.voiceflow.com/v1alpha1/public/knowledge-base/document \
  --header 'Content-Type: multipart/form-data' \
  --header 'authorization: <api-key>' \
  --form 'data={
  "type": "url",
  "url": "<string>",
  "metadata": {},
  "name": "<string>",
  "refreshRate": "daily",
  "lastSuccessUpdate": "<string>",
  "accessTokenID": 123,
  "integrationExternalID": "<string>",
  "source": "zendesk"
}'
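
The multipart `data` form field in the curl call above carries a JSON object. A minimal Python sketch, using only the standard library, of building that field; the URL and name values here are illustrative placeholders, not real documents:

```python
import json

# Placeholder document details; substitute your own values.
payload = {
    "type": "url",
    "url": "https://example.com/help/article",
    "name": "Example article",
    "refreshRate": "daily",
}

# This JSON string is what goes into the multipart form's 'data' field.
data_field = json.dumps(payload)
print(data_field)
```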
{
  "data": {
    "documentID": "<string>",
    "data": {
      "type": "csv",
      "name": "<string>",
      "rowsCount": 123
    },
    "updatedAt": "2023-11-07T05:31:56Z",
    "status": {
      "type": "ERROR",
      "data": "<unknown>"
    }
  }
}

Authorizations

authorization
string
header
required

Voiceflow Dialog Manager API key (VF.DM) or Workspace API key (VF.WS)

Headers

content-type
string

Query Parameters

maxChunkSize
any

Determines how granularly each document is broken up. The available range is 500-1500 tokens; the default is 1000. A smaller chunk size means narrower context, faster responses, fewer tokens consumed, and a greater risk of less accurate answers. Max chunk size also affects the total number of chunks parsed from a document - i.e., larger chunks mean fewer chunks retrieved.

overwrite

If set to true, the existing table with the same name will be overwritten.
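
Query parameters such as `maxChunkSize` and `overwrite` are appended to the endpoint URL. A sketch using Python's standard library; the parameter values shown are illustrative:

```python
from urllib.parse import urlencode

base = "https://realtime-api.voiceflow.com/v1alpha1/public/knowledge-base/document"
# Illustrative values: 800-token chunks, overwrite an existing table of the same name.
params = {"maxChunkSize": 800, "overwrite": "true"}
url = f"{base}?{urlencode(params)}"
print(url)
```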

markdownConversion

When enabled, HTML is automatically converted to markdown to generate better chunks.

llmBasedChunks
llmGeneratedQ

When enabled, an LLM will be used to generate a question based on the document context and specific chunk, then prepend it to the chunk. This enhances retrieval by aligning chunks with potential user queries.

llmContentSummarization

When enabled, an LLM summarizes and rewrites the content, removing unnecessary information and focusing on important parts to optimize for retrieval. Limited to 15 rows per table upload.

llmPrependContext

When enabled, an LLM generates a context summary based on the document and chunk context, and prepends it to each chunk. This improves retrieval by providing additional context to each chunk. Note: If both llmGeneratedQ and llmPrependContext are set to true, llmGeneratedQ takes precedence, and the context summarization will not be applied.
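
The precedence rule above can be illustrated with a small helper. This function is not part of the API; it only mirrors the documented behavior:

```python
def chunk_prefix_mode(llm_generated_q: bool, llm_prepend_context: bool) -> str:
    """Mirror the documented precedence: llmGeneratedQ wins over llmPrependContext."""
    if llm_generated_q:
        return "generated-question"   # a generated question is prepended to each chunk
    if llm_prepend_context:
        return "context-summary"      # a context summary is prepended to each chunk
    return "none"
```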

llmVision

Body

multipart/form-data
data
object
required

Response

201 - application/json

The document was created successfully.

data
object
required
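
A sketch of reading the 201 response body shown earlier. Field names follow the example JSON; the `documentID` value is a placeholder, and checking `status.type` for `ERROR` is an assumption about how failures surface:

```python
import json

# Example response body, shaped like the one shown above (documentID is a placeholder).
body = '''{
  "data": {
    "documentID": "abc123",
    "data": {"type": "csv", "name": "example.csv", "rowsCount": 123},
    "updatedAt": "2023-11-07T05:31:56Z",
    "status": {"type": "ERROR", "data": "<unknown>"}
  }
}'''

doc = json.loads(body)["data"]
print(doc["documentID"], doc["status"]["type"])
if doc["status"]["type"] == "ERROR":
    # Surface the error payload; its exact contents are not specified here.
    print("upload failed:", doc["status"]["data"])
```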