Update web crawl setting

Python

import os
from qaip import Qaip

client = Qaip(
    api_key=os.environ.get("QAIP_API_KEY"),  # This is the default and can be omitted
)
crawl_setting = client.crawls.update_setting(
    id="id",
    name="name",
)
print(crawl_setting.id)

curl --request PUT \
  --url https://developer.qaip.com/api/v1/crawl-settings/{id} \
  --header 'Content-Type: application/json' \
  --header 'x-api-key: <api-key>' \
  --data '
{
  "name": "<string>",
  "rrule": "<string>"
}
'

const options = {
  method: 'PUT',
  headers: {'x-api-key': '<api-key>', 'Content-Type': 'application/json'},
  body: JSON.stringify({name: '<string>', rrule: '<string>'})
};

fetch('https://developer.qaip.com/api/v1/crawl-settings/{id}', options)
  .then(res => res.json())
  .then(res => console.log(res))
  .catch(err => console.error(err));

<?php

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://developer.qaip.com/api/v1/crawl-settings/{id}",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "PUT",
  CURLOPT_POSTFIELDS => json_encode([
    'name' => '<string>',
    'rrule' => '<string>'
  ]),
  CURLOPT_HTTPHEADER => [
    "Content-Type: application/json",
    "x-api-key: <api-key>"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

if ($err) {
  echo "cURL Error #:" . $err;
} else {
  echo $response;
}

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends a PUT request to the crawl-settings endpoint with a JSON body
// containing "name" and "rrule", then prints the raw response body.
//
// Each step that can fail is checked; on failure the error is printed and
// main returns without touching the (possibly nil) response.
func main() {

	url := "https://developer.qaip.com/api/v1/crawl-settings/{id}"

	payload := strings.NewReader("{\n  \"name\": \"<string>\",\n  \"rrule\": \"<string>\"\n}")

	req, err := http.NewRequest("PUT", url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("x-api-key", "<api-key>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do fails, so return before deferring res.Body.Close().
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	fmt.Println(string(body))

}

HttpResponse<String> response = Unirest.put("https://developer.qaip.com/api/v1/crawl-settings/{id}")
  .header("x-api-key", "<api-key>")
  .header("Content-Type", "application/json")
  .body("{\n  \"name\": \"<string>\",\n  \"rrule\": \"<string>\"\n}")
  .asString();

require 'uri'
require 'net/http'

url = URI("https://developer.qaip.com/api/v1/crawl-settings/{id}")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Put.new(url)
request["x-api-key"] = '<api-key>'
request["Content-Type"] = 'application/json'
request.body = "{\n  \"name\": \"<string>\",\n  \"rrule\": \"<string>\"\n}"

response = http.request(request)
puts response.read_body

{
  "id": "<string>",
  "name": "<string>",
  "start_url": "<string>",
  "max_depth": 123,
  "html_only": true,
  "use_browser": true,
  "path_filters": [
    "<string>"
  ],
  "content_pattern": [
    "<string>"
  ],
  "max_num_files": 123,
  "file_extensions": [
    "<string>"
  ],
  "rrule": "<string>"
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

PUT /api/v1/crawl-settings/{id}

Python

import os
from qaip import Qaip

client = Qaip(
    api_key=os.environ.get("QAIP_API_KEY"),  # This is the default and can be omitted
)
crawl_setting = client.crawls.update_setting(
    id="id",
    name="name",
)
print(crawl_setting.id)

curl --request PUT \
  --url https://developer.qaip.com/api/v1/crawl-settings/{id} \
  --header 'Content-Type: application/json' \
  --header 'x-api-key: <api-key>' \
  --data '
{
  "name": "<string>",
  "rrule": "<string>"
}
'

const options = {
  method: 'PUT',
  headers: {'x-api-key': '<api-key>', 'Content-Type': 'application/json'},
  body: JSON.stringify({name: '<string>', rrule: '<string>'})
};

fetch('https://developer.qaip.com/api/v1/crawl-settings/{id}', options)
  .then(res => res.json())
  .then(res => console.log(res))
  .catch(err => console.error(err));

<?php

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://developer.qaip.com/api/v1/crawl-settings/{id}",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "PUT",
  CURLOPT_POSTFIELDS => json_encode([
    'name' => '<string>',
    'rrule' => '<string>'
  ]),
  CURLOPT_HTTPHEADER => [
    "Content-Type: application/json",
    "x-api-key: <api-key>"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

if ($err) {
  echo "cURL Error #:" . $err;
} else {
  echo $response;
}

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends a PUT request to the crawl-settings endpoint with a JSON body
// containing "name" and "rrule", then prints the raw response body.
//
// Each step that can fail is checked; on failure the error is printed and
// main returns without touching the (possibly nil) response.
func main() {

	url := "https://developer.qaip.com/api/v1/crawl-settings/{id}"

	payload := strings.NewReader("{\n  \"name\": \"<string>\",\n  \"rrule\": \"<string>\"\n}")

	req, err := http.NewRequest("PUT", url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("x-api-key", "<api-key>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do fails, so return before deferring res.Body.Close().
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	fmt.Println(string(body))

}

HttpResponse<String> response = Unirest.put("https://developer.qaip.com/api/v1/crawl-settings/{id}")
  .header("x-api-key", "<api-key>")
  .header("Content-Type", "application/json")
  .body("{\n  \"name\": \"<string>\",\n  \"rrule\": \"<string>\"\n}")
  .asString();

require 'uri'
require 'net/http'

url = URI("https://developer.qaip.com/api/v1/crawl-settings/{id}")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Put.new(url)
request["x-api-key"] = '<api-key>'
request["Content-Type"] = 'application/json'
request.body = "{\n  \"name\": \"<string>\",\n  \"rrule\": \"<string>\"\n}"

response = http.request(request)
puts response.read_body

{
  "id": "<string>",
  "name": "<string>",
  "start_url": "<string>",
  "max_depth": 123,
  "html_only": true,
  "use_browser": true,
  "path_filters": [
    "<string>"
  ],
  "content_pattern": [
    "<string>"
  ],
  "max_num_files": 123,
  "file_extensions": [
    "<string>"
  ],
  "rrule": "<string>"
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

{
  "error": {
    "message": "<string>",
    "type": "<string>"
  }
}

Authorizations

x-api-key

string

header

required

API key for authentication

Path Parameters

id

string

required

Ingestion setting ID for the web crawl data source

Body

application/json

name

string

required

Name of the web crawl data source

Maximum string length: 200

rrule

string

Recurrence rule (RFC 5545 RRULE). Sending an empty string or omitting this field removes the existing schedule.

Response

Successfully updated web crawl setting

id

string

required

Web crawl ingestion setting ID

name

string

required

Name of the web crawl ingestion setting

start_url

string

required

Start URL of the web crawl

max_depth

integer

required

Maximum crawl depth

html_only

boolean

required

When true, only HTML files will be downloaded

use_browser

boolean

required

Whether to use a headless browser for crawling

path_filters

string[]

Path filters for crawling

content_pattern

string[]

Content patterns for filtering

max_num_files

integer | null

Maximum number of files to crawl

file_extensions

string[]

File extensions to include (e.g. ".pdf", ".docx")

rrule

string

Recurrence rule (RFC 5545 RRULE)

Get web crawl setting List GitHub data sources

⌘I