Get web crawl setting

Python

import os
from qaip import Qaip

# Build the API client; the key is read from the QAIP_API_KEY environment variable.
api_key = os.environ.get("QAIP_API_KEY")  # This is the default and can be omitted
client = Qaip(api_key=api_key)

# Retrieve one web crawl setting by its ID and print the ID of the returned object.
crawl_setting = client.crawls.retrieve_setting("id")
print(crawl_setting.id)

# Retrieve one web crawl setting; substitute {id} and <api-key> before running.
curl --request GET \
  --url https://developer.qaip.com/api/v1/crawl-settings/{id} \
  --header 'x-api-key: <api-key>'

// Request configuration: a GET authenticated through the x-api-key header.
const options = {
  method: 'GET',
  headers: {'x-api-key': '<api-key>'},
};

// Retrieve the crawl setting, log the decoded JSON body, and report any failure.
fetch('https://developer.qaip.com/api/v1/crawl-settings/{id}', options)
  .then((response) => response.json())
  .then((setting) => console.log(setting))
  .catch((error) => console.error(error));

<?php

// Transfer options for a GET request authenticated through the x-api-key header.
$options = [
  CURLOPT_URL => "https://developer.qaip.com/api/v1/crawl-settings/{id}",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "GET",
  CURLOPT_HTTPHEADER => [
    "x-api-key: <api-key>"
  ],
];

$handle = curl_init();
curl_setopt_array($handle, $options);

// Run the transfer and capture any transport error before releasing the handle.
$body = curl_exec($handle);
$error = curl_error($handle);

curl_close($handle);

// Print the transport error if there is one; otherwise print the response body.
echo $error ? "cURL Error #:" . $error : $body;

package main

import (
	"fmt"
	"net/http"
	"io"
)

// main requests a single web crawl setting and prints the raw response body.
//
// Every step that can fail is checked, so a request-construction, transport,
// or read error is reported instead of being silently discarded.
func main() {
	url := "https://developer.qaip.com/api/v1/crawl-settings/{id}"

	req, err := http.NewRequest("GET", url, nil)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("x-api-key", "<api-key>")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		fmt.Println("sending request:", err)
		return
	}
	// Defer the close only after the error check: res is nil when Do fails,
	// and dereferencing it would panic.
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	fmt.Println(string(body))
}

// Send an authenticated GET for one crawl setting and read the response body as a String.
HttpResponse<String> response = Unirest.get("https://developer.qaip.com/api/v1/crawl-settings/{id}")
  .header("x-api-key", "<api-key>")
  .asString();

require 'uri'
require 'net/http'

# Endpoint of the crawl setting to retrieve.
endpoint = URI("https://developer.qaip.com/api/v1/crawl-settings/{id}")

# TLS-enabled connection to the API host.
connection = Net::HTTP.new(endpoint.host, endpoint.port)
connection.use_ssl = true

# GET request authenticated through the x-api-key header.
get_request = Net::HTTP::Get.new(endpoint)
get_request["x-api-key"] = '<api-key>'

# Send the request and print the response body.
puts connection.request(get_request).read_body

{
  "id": "<string>",
  "name": "<string>",
  "start_url": "<string>",
  "max_depth": 123,
  "html_only": true,
  "use_browser": true,
  "path_filters": [
    "<string>"
  ],
  "content_pattern": [
    "<string>"
  ],
  "max_num_files": 123,
  "file_extensions": [
    "<string>"
  ],
  "rrule": "<string>"
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

GET /api/v1/crawl-settings/{id}

Python

import os
from qaip import Qaip

# Build the API client; the key is read from the QAIP_API_KEY environment variable.
api_key = os.environ.get("QAIP_API_KEY")  # This is the default and can be omitted
client = Qaip(api_key=api_key)

# Retrieve one web crawl setting by its ID and print the ID of the returned object.
crawl_setting = client.crawls.retrieve_setting("id")
print(crawl_setting.id)

# Retrieve one web crawl setting; substitute {id} and <api-key> before running.
curl --request GET \
  --url https://developer.qaip.com/api/v1/crawl-settings/{id} \
  --header 'x-api-key: <api-key>'

// Request configuration: a GET authenticated through the x-api-key header.
const options = {
  method: 'GET',
  headers: {'x-api-key': '<api-key>'},
};

// Retrieve the crawl setting, log the decoded JSON body, and report any failure.
fetch('https://developer.qaip.com/api/v1/crawl-settings/{id}', options)
  .then((response) => response.json())
  .then((setting) => console.log(setting))
  .catch((error) => console.error(error));

<?php

// Transfer options for a GET request authenticated through the x-api-key header.
$options = [
  CURLOPT_URL => "https://developer.qaip.com/api/v1/crawl-settings/{id}",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "GET",
  CURLOPT_HTTPHEADER => [
    "x-api-key: <api-key>"
  ],
];

$handle = curl_init();
curl_setopt_array($handle, $options);

// Run the transfer and capture any transport error before releasing the handle.
$body = curl_exec($handle);
$error = curl_error($handle);

curl_close($handle);

// Print the transport error if there is one; otherwise print the response body.
echo $error ? "cURL Error #:" . $error : $body;

package main

import (
	"fmt"
	"net/http"
	"io"
)

// main requests a single web crawl setting and prints the raw response body.
//
// Every step that can fail is checked, so a request-construction, transport,
// or read error is reported instead of being silently discarded.
func main() {
	url := "https://developer.qaip.com/api/v1/crawl-settings/{id}"

	req, err := http.NewRequest("GET", url, nil)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("x-api-key", "<api-key>")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		fmt.Println("sending request:", err)
		return
	}
	// Defer the close only after the error check: res is nil when Do fails,
	// and dereferencing it would panic.
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	fmt.Println(string(body))
}

// Send an authenticated GET for one crawl setting and read the response body as a String.
HttpResponse<String> response = Unirest.get("https://developer.qaip.com/api/v1/crawl-settings/{id}")
  .header("x-api-key", "<api-key>")
  .asString();

require 'uri'
require 'net/http'

# Endpoint of the crawl setting to retrieve.
endpoint = URI("https://developer.qaip.com/api/v1/crawl-settings/{id}")

# TLS-enabled connection to the API host.
connection = Net::HTTP.new(endpoint.host, endpoint.port)
connection.use_ssl = true

# GET request authenticated through the x-api-key header.
get_request = Net::HTTP::Get.new(endpoint)
get_request["x-api-key"] = '<api-key>'

# Send the request and print the response body.
puts connection.request(get_request).read_body

{
  "id": "<string>",
  "name": "<string>",
  "start_url": "<string>",
  "max_depth": 123,
  "html_only": true,
  "use_browser": true,
  "path_filters": [
    "<string>"
  ],
  "content_pattern": [
    "<string>"
  ],
  "max_num_files": 123,
  "file_extensions": [
    "<string>"
  ],
  "rrule": "<string>"
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

Authorizations

x-api-key

string

header

required

API key for authentication

Path Parameters

id

string

required

Ingestion setting ID for the web crawl data source

Response

Successful retrieval of web crawl setting

id

string

required

Web crawl ingestion setting ID

name

string

required

Name of the web crawl ingestion setting

start_url

string

required

Start URL of the web crawl

max_depth

integer

required

Maximum crawl depth

html_only

boolean

required

When true, only HTML files will be downloaded

use_browser

boolean

required

Whether to use a headless browser for crawling

path_filters

string[]

Path filters for crawling

content_pattern

string[]

Content patterns for filtering

max_num_files

integer | null

Maximum number of files to crawl

file_extensions

string[]

File extensions to include (e.g. ".pdf", ".docx")

rrule

string

Recurrence rule (RFC 5545 RRULE)

Start deletion of web crawl data source | Update web crawl setting

⌘I