Processing pipeline

This page provides an overview of the APIs related to the processing pipeline.

The View processing pipeline dataflow is accessible via a POST call to [http|https]://[hostname]:[port]/[apiversion]/tenants/[tenantguid]/processing.

Processing pipeline (storage)

To request Processing pipeline (storage), send the request object as the body of the request.

curl --location 'http://view.homedns.org:8000/v1.0/tenants/00000000-0000-0000-0000-000000000000/processing' \
--header 'Content-Type: application/json' \
--header 'Authorization: ••••••' \
--data '{
    "Async": true,
    "Tenant": {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "Name": "Default Tenant",
        "Region": "us-west-1",
        "S3BaseDomain": "localhost",
        "DefaultPoolGUID": "00000000-0000-0000-0000-000000000000",
        "Active": true
    },
    "Collection":     {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "TenantGUID": "00000000-0000-0000-0000-000000000000",
        "Name": "My first collection",
        "AllowOverwrites": true,
        "AdditionalData": "Created by setup"
    },
    "Bucket":     {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "TenantGUID": "00000000-0000-0000-0000-000000000000",
        "PoolGUID": "00000000-0000-0000-0000-000000000000",
        "OwnerGUID": "00000000-0000-0000-0000-000000000000",
        "Category": "Data",
        "Name": "example-data-bucket",
        "RegionString": "us-west-1",
        "Versioning": true,
        "MaxMultipartUploadSeconds": 604800
    },
    "Pool": {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "TenantGUID": "00000000-0000-0000-0000-000000000000",
        "Name": "default",
        "Provider": "Disk",
        "WriteMode": "GUID",
        "UseSsl": false,
        "DiskDirectory": "./disk/",
        "Compress": "None",
        "EnableReadCaching": false
    },
    "Object": {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "ParentGUID": null,
        "TenantGUID": "00000000-0000-0000-0000-000000000000",
        "TenantName": "My default tenant",
        "PoolGUID": "00000000-0000-0000-0000-000000000000",
        "BucketGUID": "00000000-0000-0000-0000-000000000000",
        "BucketName": "data",
        "OwnerGUID": "00000000-0000-0000-0000-000000000000",
        "Key": "hello1.txt",
        "Version": "1",
        "ContentType": "text/plain",
        "DocumentType": "Text",
        "ContentLength": 13
    },
    "MetadataRule": {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "TenantGUID": "00000000-0000-0000-0000-000000000000",
        "BucketGUID": "00000000-0000-0000-0000-000000000000",
        "OwnerGUID": "00000000-0000-0000-0000-000000000000",
        "Name": "example-metadata-rule",
        "ContentType": "*",
        "MaxContentLength": 16777216,
        "DataFlowEndpoint": "http://localhost:8501/processor",
        "TypeDetectorEndpoint": "http://localhost:8501/processor/typedetector",
        "SemanticCellEndpoint": "http://localhost:8341/",
        "MaxChunkContentLength": 512,
        "ShiftSize": 448,
        "UdrEndpoint": "http://localhost:8321/",
        "TopTerms": 25,
        "CaseInsensitive": true,
        "IncludeFlattened": true,
        "DataCatalogEndpoint": "http://localhost:8201/",
        "DataCatalogType": "Lexi",
        "DataCatalogCollection": "default",
        "GraphRepositoryGUID": "00000000-0000-0000-0000-000000000000",
        "TargetBucketGUID": "00000000-0000-0000-0000-000000000000"
    },
    "EmbeddingsRule": {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "TenantGUID": "00000000-0000-0000-0000-000000000000",
        "BucketGUID": "00000000-0000-0000-0000-000000000000",
        "OwnerGUID": "00000000-0000-0000-0000-000000000000",
        "Name": "My storage server embeddings rule",
        "ContentType": "*",
        "GraphRepositoryGUID": "00000000-0000-0000-0000-000000000000",
        "VectorRepositoryGUID": "00000000-0000-0000-0000-000000000000",
        "DataFlowEndpoint": "http://localhost:8501/processor",
        "EmbeddingsGenerator": "LCProxy",
        "GeneratorUrl": "http://localhost:8301/",
        "GeneratorApiKey": "",
        "VectorStoreUrl": "http://localhost:8311/",
        "MaxContentLength": 16777216
    },
    "VectorRepository": {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "Name": "My vector repository",
        "RepositoryType": "Pgvector",
        "Model": "all-MiniLM-L6-v2",
        "Dimensionality": 384,
        "DatabaseHostname": "localhost",
        "DatabaseName": "vectordb",
        "DatabaseTable": "minilm",
        "DatabasePort": 5432,
        "DatabaseUser": "postgres",
        "DatabasePassword": "password"
    },
    "GraphRepository": {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "TenantGUID": "00000000-0000-0000-0000-000000000000",
        "Name": "My LiteGraph instance",
        "RepositoryType": "LiteGraph",
        "EndpointUrl": "http://localhost:8701/",
        "ApiKey": "default",
        "GraphIdentifier": "00000000-0000-0000-0000-000000000000"
    }
}
'
import { ViewProcessorSdk } from "view-sdk";

// SDK client; the constructor arguments are the tenant GUID, the access token, and the endpoint.
const processor = new ViewProcessorSdk(
  "00000000-0000-0000-0000-000000000000", // tenant GUID
  "default", // access token
  "http://localhost:8000/" // endpoint
);

/**
 * Sends the storage processing-pipeline request through the SDK and logs
 * the response. Any error thrown by the call is caught and logged rather
 * than rethrown.
 */
const processingPipeline = async () => {
  // Request body for the storage variant of the processing pipeline.
  const request = {
    "Async": true,
    "Tenant": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "Name": "Default Tenant",
      "Region": "us-west-1",
      "S3BaseDomain": "localhost",
      "DefaultPoolGUID": "00000000-0000-0000-0000-000000000000",
      "Active": true
    },
    "Collection": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "TenantGUID": "00000000-0000-0000-0000-000000000000",
      "Name": "My first collection",
      "AllowOverwrites": true,
      "AdditionalData": "Created by setup"
    },
    "Bucket": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "TenantGUID": "00000000-0000-0000-0000-000000000000",
      "PoolGUID": "00000000-0000-0000-0000-000000000000",
      "OwnerGUID": "00000000-0000-0000-0000-000000000000",
      "Category": "Data",
      "Name": "example-data-bucket",
      "RegionString": "us-west-1",
      "Versioning": true,
      "MaxMultipartUploadSeconds": 604800
    },
    "Pool": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "TenantGUID": "00000000-0000-0000-0000-000000000000",
      "Name": "default",
      "Provider": "Disk",
      "WriteMode": "GUID",
      "UseSsl": false,
      "DiskDirectory": "./disk/",
      "Compress": "None",
      "EnableReadCaching": false
    },
    "Object": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "ParentGUID": null,
      "TenantGUID": "00000000-0000-0000-0000-000000000000",
      "TenantName": "My default tenant",
      "PoolGUID": "00000000-0000-0000-0000-000000000000",
      "BucketGUID": "00000000-0000-0000-0000-000000000000",
      "BucketName": "data",
      "OwnerGUID": "00000000-0000-0000-0000-000000000000",
      "Key": "hello1.txt",
      "Version": "1",
      "ContentType": "text/plain",
      "DocumentType": "Text",
      "ContentLength": 13
    },
    "MetadataRule": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "TenantGUID": "00000000-0000-0000-0000-000000000000",
      "BucketGUID": "00000000-0000-0000-0000-000000000000",
      "OwnerGUID": "00000000-0000-0000-0000-000000000000",
      "Name": "example-metadata-rule",
      "ContentType": "*",
      "MaxContentLength": 16777216,
      "DataFlowEndpoint": "http://localhost:8501/processor",
      "TypeDetectorEndpoint": "http://localhost:8501/processor/typedetector",
      "SemanticCellEndpoint": "http://localhost:8341/",
      "MaxChunkContentLength": 512,
      "ShiftSize": 448,
      "UdrEndpoint": "http://localhost:8321/",
      "TopTerms": 25,
      "CaseInsensitive": true,
      "IncludeFlattened": true,
      "DataCatalogEndpoint": "http://localhost:8201/",
      "DataCatalogType": "Lexi",
      "DataCatalogCollection": "default",
      "GraphRepositoryGUID": "00000000-0000-0000-0000-000000000000",
      "TargetBucketGUID": "00000000-0000-0000-0000-000000000000"
    },
    "EmbeddingsRule": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "TenantGUID": "00000000-0000-0000-0000-000000000000",
      "BucketGUID": "00000000-0000-0000-0000-000000000000",
      "OwnerGUID": "00000000-0000-0000-0000-000000000000",
      "Name": "My storage server embeddings rule",
      "ContentType": "*",
      "GraphRepositoryGUID": "00000000-0000-0000-0000-000000000000",
      "VectorRepositoryGUID": "00000000-0000-0000-0000-000000000000",
      "DataFlowEndpoint": "http://localhost:8501/processor",
      "EmbeddingsGenerator": "LCProxy",
      "GeneratorUrl": "http://localhost:8301/",
      "GeneratorApiKey": "",
      "VectorStoreUrl": "http://localhost:8311/",
      "MaxContentLength": 16777216
    },
    "VectorRepository": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "Name": "My vector repository",
      "RepositoryType": "Pgvector",
      "Model": "all-MiniLM-L6-v2",
      "Dimensionality": 384,
      "DatabaseHostname": "localhost",
      "DatabaseName": "vectordb",
      "DatabaseTable": "minilm",
      "DatabasePort": 5432,
      "DatabaseUser": "postgres",
      "DatabasePassword": "password"
    },
    "GraphRepository": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "TenantGUID": "00000000-0000-0000-0000-000000000000",
      "Name": "My LiteGraph instance",
      "RepositoryType": "LiteGraph",
      "EndpointUrl": "http://localhost:8701/",
      "ApiKey": "default",
      "GraphIdentifier": "00000000-0000-0000-0000-000000000000"
    }
  };

  try {
    const result = await processor.processingPipeline(request);
    console.log(result);
  } catch (error) {
    console.log("Error", error);
  }
};

processingPipeline();
import view_sdk
from view_sdk import processor

sdk = view_sdk.configure(
    access_key="default",
    base_url="localhost",
    tenant_guid="00000000-0000-0000-0000-000000000000",
)


def processingPipeline():
    """Send the storage processing-pipeline request and print the result."""
    # Keyword arguments for the SDK call, collected in one mapping and
    # unpacked below; names and values match the request body shown above.
    request = {
        "Async": True,
        "Tenant": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "Name": "Default Tenant",
            "Region": "us-west-1",
            "S3BaseDomain": "localhost",
            "DefaultPoolGUID": "00000000-0000-0000-0000-000000000000",
            "Active": True,
        },
        "Collection": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "TenantGUID": "00000000-0000-0000-0000-000000000000",
            "Name": "My first collection",
            "AllowOverwrites": True,
            "AdditionalData": "Created by setup",
        },
        "Bucket": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "TenantGUID": "00000000-0000-0000-0000-000000000000",
            "PoolGUID": "00000000-0000-0000-0000-000000000000",
            "OwnerGUID": "00000000-0000-0000-0000-000000000000",
            "Category": "Data",
            "Name": "example-data-bucket",
            "RegionString": "us-west-1",
            "Versioning": True,
            "MaxMultipartUploadSeconds": 604800,
        },
        "Pool": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "TenantGUID": "00000000-0000-0000-0000-000000000000",
            "Name": "default",
            "Provider": "Disk",
            "WriteMode": "GUID",
            "UseSsl": False,
            "DiskDirectory": "./disk/",
            "Compress": "None",
            "EnableReadCaching": False,
        },
        "Object": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "ParentGUID": None,
            "TenantGUID": "00000000-0000-0000-0000-000000000000",
            "TenantName": "My default tenant",
            "PoolGUID": "00000000-0000-0000-0000-000000000000",
            "BucketGUID": "00000000-0000-0000-0000-000000000000",
            "BucketName": "data",
            "OwnerGUID": "00000000-0000-0000-0000-000000000000",
            "Key": "hello1.txt",
            "Version": "1",
            "ContentType": "text/plain",
            "DocumentType": "Text",
            "ContentLength": 13,
        },
        "MetadataRule": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "TenantGUID": "00000000-0000-0000-0000-000000000000",
            "BucketGUID": "00000000-0000-0000-0000-000000000000",
            "OwnerGUID": "00000000-0000-0000-0000-000000000000",
            "Name": "example-metadata-rule",
            "ContentType": "*",
            "MaxContentLength": 16777216,
            "DataFlowEndpoint": "http://localhost:8501/processor",
            "TypeDetectorEndpoint": "http://localhost:8501/processor/typedetector",
            "SemanticCellEndpoint": "http://localhost:8341/",
            "MaxChunkContentLength": 512,
            "ShiftSize": 448,
            "UdrEndpoint": "http://localhost:8321/",
            "TopTerms": 25,
            "CaseInsensitive": True,
            "IncludeFlattened": True,
            "DataCatalogEndpoint": "http://localhost:8201/",
            "DataCatalogType": "Lexi",
            "DataCatalogCollection": "default",
            "GraphRepositoryGUID": "00000000-0000-0000-0000-000000000000",
            "TargetBucketGUID": "00000000-0000-0000-0000-000000000000",
        },
        "EmbeddingsRule": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "TenantGUID": "00000000-0000-0000-0000-000000000000",
            "BucketGUID": "00000000-0000-0000-0000-000000000000",
            "OwnerGUID": "00000000-0000-0000-0000-000000000000",
            "Name": "My storage server embeddings rule",
            "ContentType": "*",
            "GraphRepositoryGUID": "00000000-0000-0000-0000-000000000000",
            "VectorRepositoryGUID": "00000000-0000-0000-0000-000000000000",
            "DataFlowEndpoint": "http://localhost:8501/processor",
            "EmbeddingsGenerator": "LCProxy",
            "GeneratorUrl": "http://localhost:8301/",
            "GeneratorApiKey": "",
            "VectorStoreUrl": "http://localhost:8311/",
            "MaxContentLength": 16777216,
        },
        "VectorRepository": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "Name": "My vector repository",
            "RepositoryType": "Pgvector",
            "Model": "all-MiniLM-L6-v2",
            "Dimensionality": 384,
            "DatabaseHostname": "localhost",
            "DatabaseName": "vectordb",
            "DatabaseTable": "minilm",
            "DatabasePort": 5432,
            "DatabaseUser": "postgres",
            "DatabasePassword": "password",
        },
        "GraphRepository": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "TenantGUID": "00000000-0000-0000-0000-000000000000",
            "Name": "My LiteGraph instance",
            "RepositoryType": "LiteGraph",
            "EndpointUrl": "http://localhost:8701/",
            "ApiKey": "default",
            "GraphIdentifier": "00000000-0000-0000-0000-000000000000",
        },
    }

    result = processor.Processor.processing_pipeline(**request)
    print(result)


processingPipeline()

Response

{
    "GUID": "3292d8eb-642b-40f4-a2de-9b81e66de288",
    "Success": true,
    "Async": true,
    "Timestamp": {
        "Start": "2025-04-30T13:19:30.096373Z",
        "TotalMs": 34.2,
        "Messages": {}
    }
}

Processing pipeline (crawler)

To request Processing pipeline (crawler), send the request object as the body of the request.

curl --location 'http://view.homedns.org:8000/v1.0/tenants/00000000-0000-0000-0000-000000000000/processing' \
--header 'Content-Type: application/json' \
--header 'Authorization: ••••••' \
--data '{
    "Async": true,
    "Tenant": {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "Name": "Default Tenant",
        "Region": "us-west-1",
        "S3BaseDomain": "localhost",
        "DefaultPoolGUID": "00000000-0000-0000-0000-000000000000",
        "Active": true
    },
    "Collection": {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "TenantGUID": "00000000-0000-0000-0000-000000000000",
        "Name": "My first collection",
        "AllowOverwrites": true,
        "AdditionalData": "Created by setup"
    },
    "DataRepository": {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "TenantGUID": "00000000-0000-0000-0000-000000000000",
        "OwnerGUID": "00000000-0000-0000-0000-000000000000",
        "Name": "My disk data repository",
        "RepositoryType": "File",
        "DiskDirectory": "./disk/"
    },
    "Object": {
        "GUID": "00000000-0000-0000-0000-000000000001",
        "ParentGUID": null,
        "TenantGUID": "00000000-0000-0000-0000-000000000000",
        "TenantName": "My default tenant",
        "NodeGUID": null,
        "PoolGUID": "00000000-0000-0000-0000-000000000000",
        "BucketGUID": "00000000-0000-0000-0000-000000000000",
        "BucketName": "data",
        "OwnerGUID": "00000000-0000-0000-0000-000000000000",
        "Key": "hello2.txt",
        "Version": "1",
        "ContentType": "text/plain",
        "DocumentType": "Text",
        "ContentLength": 13,
        "Data": "VGhpcyBpcyBhIHNhbXBsZSBkb2N1bWVudCB3aXRoIGp1c3QgYSBoYW5kZnVsIG9mIHdvcmRzIHRoYXQgd2lsbCBiZSBwcm9jZXNzZWQgYnkgVmlldw=="
    },
    "MetadataRule": {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "TenantGUID": "00000000-0000-0000-0000-000000000000",
        "BucketGUID": "00000000-0000-0000-0000-000000000000",
        "OwnerGUID": "00000000-0000-0000-0000-000000000000",
        "Name": "example-metadata-rule",
        "ContentType": "*",
        "MaxContentLength": 16777216,
        "DataFlowEndpoint": "http://localhost:8501/processor",
        "TypeDetectorEndpoint": "http://localhost:8501/processor/typedetector",
        "SemanticCellEndpoint": "http://localhost:8341/",
        "MaxChunkContentLength": 512,
        "ShiftSize": 448,
        "UdrEndpoint": "http://localhost:8321/",
        "TopTerms": 25,
        "CaseInsensitive": true,
        "IncludeFlattened": true,
        "DataCatalogEndpoint": "http://localhost:8201/",
        "DataCatalogType": "Lexi",
        "DataCatalogCollection": "00000000-0000-0000-0000-000000000000",
        "GraphRepositoryGUID": "00000000-0000-0000-0000-000000000000"
    },
    "EmbeddingsRule": {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "TenantGUID": "00000000-0000-0000-0000-000000000000",
        "BucketGUID": "00000000-0000-0000-0000-000000000000",
        "OwnerGUID": "00000000-0000-0000-0000-000000000000",
        "Name": "My storage server embeddings rule",
        "ContentType": "*",
        "GraphRepositoryGUID": "00000000-0000-0000-0000-000000000000",
        "VectorRepositoryGUID": "00000000-0000-0000-0000-000000000000",
        "DataFlowEndpoint": "http://localhost:8501/processor",
        "EmbeddingsGenerator": "LCProxy",
        "GeneratorUrl": "http://localhost:8301/",
        "GeneratorApiKey": "",
        "VectorStoreUrl": "http://localhost:8311/",
        "MaxContentLength": 16777216
    },
    "VectorRepository": {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "TenantGUID": "00000000-0000-0000-0000-000000000000",
        "Name": "My vector repository",
        "RepositoryType": "Pgvector",
        "Model": "all-MiniLM-L6-v2",
        "Dimensionality": 384,
        "DatabaseHostname": "localhost",
        "DatabaseName": "vectordb",
        "DatabaseTable": "minilm",
        "DatabasePort": 5432,
        "DatabaseUser": "postgres",
        "DatabasePassword": "password"
    },
    "GraphRepository": {
        "GUID": "00000000-0000-0000-0000-000000000000",
        "TenantGUID": "00000000-0000-0000-0000-000000000000",
        "Name": "My LiteGraph instance",
        "RepositoryType": "LiteGraph",
        "EndpointUrl": "http://localhost:8701/",
        "ApiKey": "default",
        "GraphIdentifier": "00000000-0000-0000-0000-000000000000"
    }
}
'
import { ViewProcessorSdk } from "view-sdk";

// SDK client; the constructor arguments are the tenant GUID, the access token, and the endpoint.
const processor = new ViewProcessorSdk(
  "00000000-0000-0000-0000-000000000000", // tenant GUID
  "default", // access token
  "http://localhost:8000/" // endpoint
);

/**
 * Sends the crawler processing-pipeline request through the SDK and logs
 * the response. Any error thrown by the call is caught and logged rather
 * than rethrown.
 */
const processingPipeline = async () => {
  // Request body for the crawler variant: it carries a DataRepository and
  // inline object Data instead of Bucket/Pool entries.
  const request = {
    "Async": true,
    "Tenant": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "Name": "Default Tenant",
      "Region": "us-west-1",
      "S3BaseDomain": "localhost",
      "DefaultPoolGUID": "00000000-0000-0000-0000-000000000000",
      "Active": true
    },
    "Collection": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "TenantGUID": "00000000-0000-0000-0000-000000000000",
      "Name": "My first collection",
      "AllowOverwrites": true,
      "AdditionalData": "Created by setup"
    },
    "DataRepository": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "TenantGUID": "00000000-0000-0000-0000-000000000000",
      "OwnerGUID": "00000000-0000-0000-0000-000000000000",
      "Name": "My disk data repository",
      "RepositoryType": "File",
      "DiskDirectory": "./disk/"
    },
    "Object": {
      "GUID": "00000000-0000-0000-0000-000000000001",
      "ParentGUID": null,
      "TenantGUID": "00000000-0000-0000-0000-000000000000",
      "TenantName": "My default tenant",
      "NodeGUID": null,
      "PoolGUID": "00000000-0000-0000-0000-000000000000",
      "BucketGUID": "00000000-0000-0000-0000-000000000000",
      "BucketName": "data",
      "OwnerGUID": "00000000-0000-0000-0000-000000000000",
      "Key": "hello2.txt",
      "Version": "1",
      "ContentType": "text/plain",
      "DocumentType": "Text",
      // NOTE(review): ContentLength is 13, but the base64 Data below decodes
      // to more than 13 bytes — confirm which value the service expects.
      "ContentLength": 13,
      "Data": "VGhpcyBpcyBhIHNhbXBsZSBkb2N1bWVudCB3aXRoIGp1c3QgYSBoYW5kZnVsIG9mIHdvcmRzIHRoYXQgd2lsbCBiZSBwcm9jZXNzZWQgYnkgVmlldw=="
    },
    "MetadataRule": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "TenantGUID": "00000000-0000-0000-0000-000000000000",
      "BucketGUID": "00000000-0000-0000-0000-000000000000",
      "OwnerGUID": "00000000-0000-0000-0000-000000000000",
      "Name": "example-metadata-rule",
      "ContentType": "*",
      "MaxContentLength": 16777216,
      "DataFlowEndpoint": "http://localhost:8501/processor",
      "TypeDetectorEndpoint": "http://localhost:8501/processor/typedetector",
      "SemanticCellEndpoint": "http://localhost:8341/",
      "MaxChunkContentLength": 512,
      "ShiftSize": 448,
      "UdrEndpoint": "http://localhost:8321/",
      "TopTerms": 25,
      "CaseInsensitive": true,
      "IncludeFlattened": true,
      "DataCatalogEndpoint": "http://localhost:8201/",
      "DataCatalogType": "Lexi",
      "DataCatalogCollection": "00000000-0000-0000-0000-000000000000",
      "GraphRepositoryGUID": "00000000-0000-0000-0000-000000000000"
    },
    "EmbeddingsRule": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "TenantGUID": "00000000-0000-0000-0000-000000000000",
      "BucketGUID": "00000000-0000-0000-0000-000000000000",
      "OwnerGUID": "00000000-0000-0000-0000-000000000000",
      "Name": "My storage server embeddings rule",
      "ContentType": "*",
      "GraphRepositoryGUID": "00000000-0000-0000-0000-000000000000",
      "VectorRepositoryGUID": "00000000-0000-0000-0000-000000000000",
      "DataFlowEndpoint": "http://localhost:8501/processor",
      "EmbeddingsGenerator": "LCProxy",
      "GeneratorUrl": "http://localhost:8301/",
      "GeneratorApiKey": "",
      "VectorStoreUrl": "http://localhost:8311/",
      "MaxContentLength": 16777216
    },
    "VectorRepository": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "TenantGUID": "00000000-0000-0000-0000-000000000000",
      "Name": "My vector repository",
      "RepositoryType": "Pgvector",
      "Model": "all-MiniLM-L6-v2",
      "Dimensionality": 384,
      "DatabaseHostname": "localhost",
      "DatabaseName": "vectordb",
      "DatabaseTable": "minilm",
      "DatabasePort": 5432,
      "DatabaseUser": "postgres",
      "DatabasePassword": "password"
    },
    "GraphRepository": {
      "GUID": "00000000-0000-0000-0000-000000000000",
      "TenantGUID": "00000000-0000-0000-0000-000000000000",
      "Name": "My LiteGraph instance",
      "RepositoryType": "LiteGraph",
      "EndpointUrl": "http://localhost:8701/",
      "ApiKey": "default",
      "GraphIdentifier": "00000000-0000-0000-0000-000000000000"
    }
  };

  try {
    const result = await processor.processingPipeline(request);
    console.log(result);
  } catch (error) {
    console.log("Error", error);
  }
};

processingPipeline();
import view_sdk
from view_sdk import processor

sdk = view_sdk.configure(
    access_key="default",
    base_url="localhost",
    tenant_guid="00000000-0000-0000-0000-000000000000",
)


def processingPipeline():
    """Send the crawler processing-pipeline request and print the result."""
    # Keyword arguments for the SDK call, collected in one mapping and
    # unpacked below; names and values match the request body shown above.
    request = {
        "Async": True,
        "Tenant": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "Name": "Default Tenant",
            "Region": "us-west-1",
            "S3BaseDomain": "localhost",
            "DefaultPoolGUID": "00000000-0000-0000-0000-000000000000",
            "Active": True,
        },
        "Collection": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "TenantGUID": "00000000-0000-0000-0000-000000000000",
            "Name": "My first collection",
            "AllowOverwrites": True,
            "AdditionalData": "Created by setup",
        },
        "DataRepository": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "TenantGUID": "00000000-0000-0000-0000-000000000000",
            "OwnerGUID": "00000000-0000-0000-0000-000000000000",
            "Name": "My disk data repository",
            "RepositoryType": "File",
            "DiskDirectory": "./disk/",
        },
        "Object": {
            "GUID": "00000000-0000-0000-0000-000000000001",
            "ParentGUID": None,
            "TenantGUID": "00000000-0000-0000-0000-000000000000",
            "TenantName": "My default tenant",
            "NodeGUID": None,
            "PoolGUID": "00000000-0000-0000-0000-000000000000",
            "BucketGUID": "00000000-0000-0000-0000-000000000000",
            "BucketName": "data",
            "OwnerGUID": "00000000-0000-0000-0000-000000000000",
            "Key": "hello2.txt",
            "Version": "1",
            "ContentType": "text/plain",
            "DocumentType": "Text",
            # NOTE(review): ContentLength is 13, but the base64 Data below
            # decodes to more than 13 bytes — confirm which value is expected.
            "ContentLength": 13,
            "Data": "VGhpcyBpcyBhIHNhbXBsZSBkb2N1bWVudCB3aXRoIGp1c3QgYSBoYW5kZnVsIG9mIHdvcmRzIHRoYXQgd2lsbCBiZSBwcm9jZXNzZWQgYnkgVmlldw==",
        },
        "MetadataRule": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "TenantGUID": "00000000-0000-0000-0000-000000000000",
            "BucketGUID": "00000000-0000-0000-0000-000000000000",
            "OwnerGUID": "00000000-0000-0000-0000-000000000000",
            "Name": "example-metadata-rule",
            "ContentType": "*",
            "MaxContentLength": 16777216,
            "DataFlowEndpoint": "http://localhost:8501/processor",
            "TypeDetectorEndpoint": "http://localhost:8501/processor/typedetector",
            "SemanticCellEndpoint": "http://localhost:8341/",
            "MaxChunkContentLength": 512,
            "ShiftSize": 448,
            "UdrEndpoint": "http://localhost:8321/",
            "TopTerms": 25,
            "CaseInsensitive": True,
            "IncludeFlattened": True,
            "DataCatalogEndpoint": "http://localhost:8201/",
            "DataCatalogType": "Lexi",
            "DataCatalogCollection": "00000000-0000-0000-0000-000000000000",
            "GraphRepositoryGUID": "00000000-0000-0000-0000-000000000000",
        },
        "EmbeddingsRule": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "TenantGUID": "00000000-0000-0000-0000-000000000000",
            "BucketGUID": "00000000-0000-0000-0000-000000000000",
            "OwnerGUID": "00000000-0000-0000-0000-000000000000",
            "Name": "My storage server embeddings rule",
            "ContentType": "*",
            "GraphRepositoryGUID": "00000000-0000-0000-0000-000000000000",
            "VectorRepositoryGUID": "00000000-0000-0000-0000-000000000000",
            "DataFlowEndpoint": "http://localhost:8501/processor",
            "EmbeddingsGenerator": "LCProxy",
            "GeneratorUrl": "http://localhost:8301/",
            "GeneratorApiKey": "",
            "VectorStoreUrl": "http://localhost:8311/",
            "MaxContentLength": 16777216,
        },
        "VectorRepository": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "TenantGUID": "00000000-0000-0000-0000-000000000000",
            "Name": "My vector repository",
            "RepositoryType": "Pgvector",
            "Model": "all-MiniLM-L6-v2",
            "Dimensionality": 384,
            "DatabaseHostname": "localhost",
            "DatabaseName": "vectordb",
            "DatabaseTable": "minilm",
            "DatabasePort": 5432,
            "DatabaseUser": "postgres",
            "DatabasePassword": "password",
        },
        "GraphRepository": {
            "GUID": "00000000-0000-0000-0000-000000000000",
            "TenantGUID": "00000000-0000-0000-0000-000000000000",
            "Name": "My LiteGraph instance",
            "RepositoryType": "LiteGraph",
            "EndpointUrl": "http://localhost:8701/",
            "ApiKey": "default",
            "GraphIdentifier": "00000000-0000-0000-0000-000000000000",
        },
    }

    # NOTE(review): the storage example on this page calls
    # processing_pipeline; confirm process_crawler is the intended SDK method.
    result = processor.Processor.process_crawler(**request)
    print(result)


processingPipeline()

Response

{
    "GUID": "3292d8eb-642b-40f4-a2de-9b81e66de288",
    "Success": true,
    "Async": true,
    "Timestamp": {
        "Start": "2025-04-30T13:19:30.096373Z",
        "TotalMs": 34.2,
        "Messages": {}
    }
}