Web crawler job

List Web Crawler Jobs

Lists web crawler jobs.

GET
/web-crawler-jobs.list
Authorization: Bearer <token>

All the DevRev APIs require a token to authenticate the user. Provide Authorization: Bearer <TOKEN> as a header to every API request. How do I find my token?

In: header

Query Parameters

created_by?: array<string>

Filters for web crawler jobs created by any of the provided users.

cursor?: string

The cursor to resume iteration from. If not provided, then iteration starts from the beginning.

Format: text
limit?: integer

The maximum number of web crawler jobs to return. The default is '50'.

Format: int32
mode?: string

The iteration mode to use. If not set, "after" is used.

Value in: "after" | "before"

Response Body

curl -X GET "https://api.devrev.ai/web-crawler-jobs.list?created_by=DEVU-12345&cursor=string&limit=0&mode=after" -H "Authorization: Bearer <token>"
{
  "next_cursor": "string",
  "prev_cursor": "string",
  "web_crawler_jobs": [
    {
      "created_by": {
        "type": "dev_user",
        "display_id": "string",
        "id": "string",
        "display_name": "string",
        "display_picture": {
          "display_id": "string",
          "id": "string",
          "file": {
            "type": "string",
            "name": "string",
            "size": 0
          }
        },
        "email": "string",
        "full_name": "string",
        "state": "active"
      },
      "created_date": "2023-01-01T12:00:00.000Z",
      "display_id": "string",
      "id": "string",
      "modified_by": {
        "type": "dev_user",
        "display_id": "string",
        "id": "string",
        "display_name": "string",
        "display_picture": {
          "display_id": "string",
          "id": "string",
          "file": {
            "type": "string",
            "name": "string",
            "size": 0
          }
        },
        "email": "string",
        "full_name": "string",
        "state": "active"
      },
      "modified_date": "2023-01-01T12:00:00.000Z",
      "accept_regexs": [
        "string"
      ],
      "description": "string",
      "domain_names": [
        "string"
      ],
      "frequency": 0,
      "max_depth": 0,
      "no_parent": true,
      "notify_on_complete": true,
      "num_bytes": 0,
      "num_timeout_urls": 0,
      "num_urls_scraped": 0,
      "reject_regexs": [
        "string"
      ],
      "sitemap_index_urls": [
        "string"
      ],
      "sitemap_urls": [
        "string"
      ],
      "state": "aborted",
      "urls": [
        "string"
      ],
      "user_agent": "string"
    }
  ]
}
{
  "detail": "string",
  "message": "string",
  "type": "artifact_already_attached_to_a_parent",
  "existing_parent": "string",
  "is_same": true
}
{
  "detail": "string",
  "message": "string",
  "type": "unauthenticated"
}
{
  "detail": "string",
  "message": "string",
  "type": "forbidden"
}
{
  "detail": "string",
  "message": "string",
  "type": "too_many_requests",
  "retry_after": 0
}
{
  "detail": "string",
  "message": "string",
  "type": "internal_error",
  "reference_id": "string"
}
{
  "detail": "string",
  "message": "string",
  "type": "service_unavailable"
}