Chunk using semantic chunker

import requests

# Endpoint of the asynchronous semantic chunker. Replace {MODEL_ID} with the
# identifier of the model to use.
url = "https://application_id.applications.lucidworks.com/ai/async-chunking/semantic/{MODEL_ID}"

# Request body: the text to chunk plus the model, use-case, and chunker settings.
payload = {
    "batch": [{ "text": "The content to be split into chunks. " }],
    "modelConfig": {
        "vectorQuantizationMethod": "min-max",
        "dimReductionSize": 256
    },
    "useCaseConfig": { "dataType": "query" },
    "chunkerConfig": {
        "maxChunkSize": 512,
        "overlapSize": 1,
        "cosineThreshold": 0.567,
        "approximate": True
    }
}
headers = {
    "Authorization": "<authorization>",
    "Content-Type": "application/json"
}

# requests waits forever unless a timeout is given; bound the wait (in seconds)
# so the script cannot hang on an unresponsive server.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body returned by the service.
print(response.text)

// Target endpoint; replace {MODEL_ID} with the identifier of the model to use.
String endpoint = "https://application_id.applications.lucidworks.com/ai/async-chunking/semantic/{MODEL_ID}";

// JSON request body: the text to chunk plus model, use-case, and chunker settings.
String requestJson = "{\n  \"batch\": [\n    {\n      \"text\": \"The content to be split into chunks. \"\n    }\n  ],\n  \"modelConfig\": {\n    \"vectorQuantizationMethod\": \"min-max\",\n    \"dimReductionSize\": 256\n  },\n  \"useCaseConfig\": {\n    \"dataType\": \"query\"\n  },\n  \"chunkerConfig\": {\n    \"maxChunkSize\": 512,\n    \"overlapSize\": 1,\n    \"cosineThreshold\": 0.567,\n    \"approximate\": true\n  }\n}";

// POST the body and read the response as a string.
HttpResponse<String> response = Unirest.post(endpoint)
  .header("Authorization", "<authorization>")
  .header("Content-Type", "application/json")
  .body(requestJson)
  .asString();

// Chunking request: the input text plus model, use-case, and chunker settings.
const requestBody = {
  batch: [{text: 'The content to be split into chunks. '}],
  modelConfig: {vectorQuantizationMethod: 'min-max', dimReductionSize: 256},
  useCaseConfig: {dataType: 'query'},
  chunkerConfig: {maxChunkSize: 512, overlapSize: 1, cosineThreshold: 0.567, approximate: true}
};

const options = {
  method: 'POST',
  headers: {Authorization: '<authorization>', 'Content-Type': 'application/json'},
  body: JSON.stringify(requestBody)
};

// Send the request and log the parsed JSON response; any failure along the way
// is reported with console.error.
(async () => {
  try {
    const res = await fetch('https://application_id.applications.lucidworks.com/ai/async-chunking/semantic/{MODEL_ID}', options);
    const parsed = await res.json();
    console.log(parsed);
  } catch (err) {
    console.error(err);
  }
})();

require 'uri'
require 'net/http'

# Endpoint of the semantic chunker; replace {MODEL_ID} with the model identifier.
endpoint = URI("https://application_id.applications.lucidworks.com/ai/async-chunking/semantic/{MODEL_ID}")

# HTTPS client for the endpoint's host and port.
client = Net::HTTP.new(endpoint.host, endpoint.port)
client.use_ssl = true

# Build the POST request: headers first, then the JSON body.
post = Net::HTTP::Post.new(endpoint)
post["Authorization"] = '<authorization>'
post["Content-Type"] = 'application/json'
post.body = "{\n  \"batch\": [\n    {\n      \"text\": \"The content to be split into chunks. \"\n    }\n  ],\n  \"modelConfig\": {\n    \"vectorQuantizationMethod\": \"min-max\",\n    \"dimReductionSize\": 256\n  },\n  \"useCaseConfig\": {\n    \"dataType\": \"query\"\n  },\n  \"chunkerConfig\": {\n    \"maxChunkSize\": 512,\n    \"overlapSize\": 1,\n    \"cosineThreshold\": 0.567,\n    \"approximate\": true\n  }\n}"

# Send the request and print the response body.
puts client.request(post).read_body

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main submits a semantic chunking request and prints the raw response body.
// Each step's error is checked; on failure the error is printed and main returns.
func main() {

	// Replace {MODEL_ID} with the identifier of the model to use.
	url := "https://application_id.applications.lucidworks.com/ai/async-chunking/semantic/{MODEL_ID}"

	payload := strings.NewReader("{\n  \"batch\": [\n    {\n      \"text\": \"The content to be split into chunks. \"\n    }\n  ],\n  \"modelConfig\": {\n    \"vectorQuantizationMethod\": \"min-max\",\n    \"dimReductionSize\": 256\n  },\n  \"useCaseConfig\": {\n    \"dataType\": \"query\"\n  },\n  \"chunkerConfig\": {\n    \"maxChunkSize\": 512,\n    \"overlapSize\": 1,\n    \"cosineThreshold\": 0.567,\n    \"approximate\": true\n  }\n}")

	req, err := http.NewRequest(http.MethodPost, url, payload)
	if err != nil {
		fmt.Println("failed to build request:", err)
		return
	}

	req.Header.Add("Authorization", "<authorization>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res may be nil when Do fails, so bail out before touching res.Body.
		fmt.Println("request failed:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("failed to read response body:", err)
		return
	}

	fmt.Println(string(body))

}

<?php

// Request body: the text to chunk plus model, use-case, and chunker settings.
$payload = [
  'batch' => [
    ['text' => 'The content to be split into chunks. ']
  ],
  'modelConfig' => [
    'vectorQuantizationMethod' => 'min-max',
    'dimReductionSize' => 256
  ],
  'useCaseConfig' => [
    'dataType' => 'query'
  ],
  'chunkerConfig' => [
    'maxChunkSize' => 512,
    'overlapSize' => 1,
    'cosineThreshold' => 0.567,
    'approximate' => true
  ]
];

// Headers sent with the request.
$requestHeaders = [
  "Authorization: <authorization>",
  "Content-Type: application/json"
];

// Configure a cURL handle for a POST to the semantic chunker endpoint;
// replace {MODEL_ID} in the URL with the model identifier.
$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://application_id.applications.lucidworks.com/ai/async-chunking/semantic/{MODEL_ID}",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode($payload),
  CURLOPT_HTTPHEADER => $requestHeaders,
]);

// Run the transfer, capture any cURL error message, then release the handle.
$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

// Print the cURL error if there was one, otherwise the response body.
echo $err ? "cURL Error #:" . $err : $response;

# Submit text to the semantic chunker; replace {MODEL_ID} with the model identifier.
curl -X POST \
  'https://application_id.applications.lucidworks.com/ai/async-chunking/semantic/{MODEL_ID}' \
  -H 'Authorization: <authorization>' \
  -H 'Content-Type: application/json' \
  -d '
{
  "batch": [
    {
      "text": "The content to be split into chunks. "
    }
  ],
  "modelConfig": {
    "vectorQuantizationMethod": "min-max",
    "dimReductionSize": 256
  },
  "useCaseConfig": {
    "dataType": "query"
  },
  "chunkerConfig": {
    "maxChunkSize": 512,
    "overlapSize": 1,
    "cosineThreshold": 0.567,
    "approximate": true
  }
}
'

{
  "chunkingId": "441eb3be-7de6-470a-8141-e416a15c7db1",
  "status": "SUBMITTED"
}

{
  "chunkingId": "441eb3be-7de6-470a-8141-e416a15c7db1",
  "status": "READY",
  "message": "<string>"
}

Chunk using semantic chunker

The semantic chunker (chunking strategy) creates chunks based on semantic similarity.

Using the model specified in the request URL, the semantic chunker splits the text into sentences, encodes each sentence, and then compares each sentence to the chunk being built to determine whether they are similar enough to group together.

After merging two semantically-similar sentences into a pre-chunk, the semantic chunker needs to encode it to get its vector to compare with the next sentence vector.

This chunker is the slowest of all of the chunkers even if you set the approximate field to true.

POST

async-chunking

semantic

{MODEL_ID}

Chunk using semantic chunker

import requests

# Endpoint of the asynchronous semantic chunker. Replace {MODEL_ID} with the
# identifier of the model to use.
url = "https://application_id.applications.lucidworks.com/ai/async-chunking/semantic/{MODEL_ID}"

# Request body: the text to chunk plus the model, use-case, and chunker settings.
payload = {
    "batch": [{ "text": "The content to be split into chunks. " }],
    "modelConfig": {
        "vectorQuantizationMethod": "min-max",
        "dimReductionSize": 256
    },
    "useCaseConfig": { "dataType": "query" },
    "chunkerConfig": {
        "maxChunkSize": 512,
        "overlapSize": 1,
        "cosineThreshold": 0.567,
        "approximate": True
    }
}
headers = {
    "Authorization": "<authorization>",
    "Content-Type": "application/json"
}

# requests waits forever unless a timeout is given; bound the wait (in seconds)
# so the script cannot hang on an unresponsive server.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body returned by the service.
print(response.text)

// Target endpoint; replace {MODEL_ID} with the identifier of the model to use.
String endpoint = "https://application_id.applications.lucidworks.com/ai/async-chunking/semantic/{MODEL_ID}";

// JSON request body: the text to chunk plus model, use-case, and chunker settings.
String requestJson = "{\n  \"batch\": [\n    {\n      \"text\": \"The content to be split into chunks. \"\n    }\n  ],\n  \"modelConfig\": {\n    \"vectorQuantizationMethod\": \"min-max\",\n    \"dimReductionSize\": 256\n  },\n  \"useCaseConfig\": {\n    \"dataType\": \"query\"\n  },\n  \"chunkerConfig\": {\n    \"maxChunkSize\": 512,\n    \"overlapSize\": 1,\n    \"cosineThreshold\": 0.567,\n    \"approximate\": true\n  }\n}";

// POST the body and read the response as a string.
HttpResponse<String> response = Unirest.post(endpoint)
  .header("Authorization", "<authorization>")
  .header("Content-Type", "application/json")
  .body(requestJson)
  .asString();

// Chunking request: the input text plus model, use-case, and chunker settings.
const requestBody = {
  batch: [{text: 'The content to be split into chunks. '}],
  modelConfig: {vectorQuantizationMethod: 'min-max', dimReductionSize: 256},
  useCaseConfig: {dataType: 'query'},
  chunkerConfig: {maxChunkSize: 512, overlapSize: 1, cosineThreshold: 0.567, approximate: true}
};

const options = {
  method: 'POST',
  headers: {Authorization: '<authorization>', 'Content-Type': 'application/json'},
  body: JSON.stringify(requestBody)
};

// Send the request and log the parsed JSON response; any failure along the way
// is reported with console.error.
(async () => {
  try {
    const res = await fetch('https://application_id.applications.lucidworks.com/ai/async-chunking/semantic/{MODEL_ID}', options);
    const parsed = await res.json();
    console.log(parsed);
  } catch (err) {
    console.error(err);
  }
})();

require 'uri'
require 'net/http'

# Endpoint of the semantic chunker; replace {MODEL_ID} with the model identifier.
endpoint = URI("https://application_id.applications.lucidworks.com/ai/async-chunking/semantic/{MODEL_ID}")

# HTTPS client for the endpoint's host and port.
client = Net::HTTP.new(endpoint.host, endpoint.port)
client.use_ssl = true

# Build the POST request: headers first, then the JSON body.
post = Net::HTTP::Post.new(endpoint)
post["Authorization"] = '<authorization>'
post["Content-Type"] = 'application/json'
post.body = "{\n  \"batch\": [\n    {\n      \"text\": \"The content to be split into chunks. \"\n    }\n  ],\n  \"modelConfig\": {\n    \"vectorQuantizationMethod\": \"min-max\",\n    \"dimReductionSize\": 256\n  },\n  \"useCaseConfig\": {\n    \"dataType\": \"query\"\n  },\n  \"chunkerConfig\": {\n    \"maxChunkSize\": 512,\n    \"overlapSize\": 1,\n    \"cosineThreshold\": 0.567,\n    \"approximate\": true\n  }\n}"

# Send the request and print the response body.
puts client.request(post).read_body

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main submits a semantic chunking request and prints the raw response body.
// Each step's error is checked; on failure the error is printed and main returns.
func main() {

	// Replace {MODEL_ID} with the identifier of the model to use.
	url := "https://application_id.applications.lucidworks.com/ai/async-chunking/semantic/{MODEL_ID}"

	payload := strings.NewReader("{\n  \"batch\": [\n    {\n      \"text\": \"The content to be split into chunks. \"\n    }\n  ],\n  \"modelConfig\": {\n    \"vectorQuantizationMethod\": \"min-max\",\n    \"dimReductionSize\": 256\n  },\n  \"useCaseConfig\": {\n    \"dataType\": \"query\"\n  },\n  \"chunkerConfig\": {\n    \"maxChunkSize\": 512,\n    \"overlapSize\": 1,\n    \"cosineThreshold\": 0.567,\n    \"approximate\": true\n  }\n}")

	req, err := http.NewRequest(http.MethodPost, url, payload)
	if err != nil {
		fmt.Println("failed to build request:", err)
		return
	}

	req.Header.Add("Authorization", "<authorization>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res may be nil when Do fails, so bail out before touching res.Body.
		fmt.Println("request failed:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("failed to read response body:", err)
		return
	}

	fmt.Println(string(body))

}

<?php

// Request body: the text to chunk plus model, use-case, and chunker settings.
$payload = [
  'batch' => [
    ['text' => 'The content to be split into chunks. ']
  ],
  'modelConfig' => [
    'vectorQuantizationMethod' => 'min-max',
    'dimReductionSize' => 256
  ],
  'useCaseConfig' => [
    'dataType' => 'query'
  ],
  'chunkerConfig' => [
    'maxChunkSize' => 512,
    'overlapSize' => 1,
    'cosineThreshold' => 0.567,
    'approximate' => true
  ]
];

// Headers sent with the request.
$requestHeaders = [
  "Authorization: <authorization>",
  "Content-Type: application/json"
];

// Configure a cURL handle for a POST to the semantic chunker endpoint;
// replace {MODEL_ID} in the URL with the model identifier.
$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://application_id.applications.lucidworks.com/ai/async-chunking/semantic/{MODEL_ID}",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode($payload),
  CURLOPT_HTTPHEADER => $requestHeaders,
]);

// Run the transfer, capture any cURL error message, then release the handle.
$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

// Print the cURL error if there was one, otherwise the response body.
echo $err ? "cURL Error #:" . $err : $response;

# Submit text to the semantic chunker; replace {MODEL_ID} with the model identifier.
curl -X POST \
  'https://application_id.applications.lucidworks.com/ai/async-chunking/semantic/{MODEL_ID}' \
  -H 'Authorization: <authorization>' \
  -H 'Content-Type: application/json' \
  -d '
{
  "batch": [
    {
      "text": "The content to be split into chunks. "
    }
  ],
  "modelConfig": {
    "vectorQuantizationMethod": "min-max",
    "dimReductionSize": 256
  },
  "useCaseConfig": {
    "dataType": "query"
  },
  "chunkerConfig": {
    "maxChunkSize": 512,
    "overlapSize": 1,
    "cosineThreshold": 0.567,
    "approximate": true
  }
}
'

{
  "chunkingId": "441eb3be-7de6-470a-8141-e416a15c7db1",
  "status": "SUBMITTED"
}

{
  "chunkingId": "441eb3be-7de6-470a-8141-e416a15c7db1",
  "status": "READY",
  "message": "<string>"
}

Headers

Authorization

string

required

Bearer token used for authentication. Format: Authorization: Bearer ACCESS_TOKEN.

Content-Type

string

application/json

Example:

"application/json"

Path Parameters

MODEL_ID

string

required

Unique identifier for the model.

Example:

"gte-small"

Body

application/json

batch

object[]

The batch of key:value pairs used in the chunking request.

Show child attributes

modelConfig

ModelConfig · object

Provides fields and values that specify ranges for tokens.

Show child attributes

useCaseConfig

UseCaseConfigChunking · object

Show child attributes

chunkerConfig

SemanticChunkerConfig · object

The semantic chunker (chunking strategy) creates chunks based on semantic similarity.

After merging two semantically-similar sentences into a pre-chunk, the semantic chunker needs to encode it to get its vector to compare with the next sentence vector.

This chunker is the slowest of all of the chunkers even if you set the approximate field to true.

This is the default chunker configuration if nothing is passed.

Show child attributes

Response

This is the response to the POST chunking request submitted for a specific chunker and modelId.

chunkingId

string<uuid>

The universally unique identifier (UUID) returned in the response to the POST request. This UUID is required in the GET request to retrieve results.

Example:

"441eb3be-7de6-470a-8141-e416a15c7db1"

status

string

The current status of the request. Allowed values are:

SUBMITTED - The POST request was successful and the response has returned the chunkingId and status that are used by the GET request.
ERROR - An error was generated when the GET request was sent.
READY - The results associated with the chunkingId are available and ready to be retrieved.
RETRIEVED - The results associated with the chunkingId were returned successfully when the GET request was sent.

Example:

"SUBMITTED"

Split text on a regex Split text on sentences