cli_schedule
Schedule automated web archiving tasks to regularly capture and preserve website snapshots at specified intervals with customizable crawl settings.
Instructions
Execute the `archivebox schedule` command.
Input Schema
| Name | Required | Description | Default |
|---|---|---|---|
| import_path | No | Path to import file | `null` |
| add | No | Enable adding new URLs | `false` |
| every | No | Schedule frequency (e.g., 'daily') | `null` |
| tag | No | Comma-separated tags | `""` |
| depth | No | Crawl depth | `0` |
| overwrite | No | Overwrite existing files | `false` |
| update | No | Update existing snapshots | `false` |
| clear | No | Clear existing schedules | `false` |
| extra_data | No | Additional parameters as a dictionary | `null` |
Input Schema (JSON Schema)
{
"properties": {
"add": {
"default": false,
"description": "Enable adding new URLs",
"type": "boolean"
},
"clear": {
"default": false,
"description": "Clear existing schedules",
"type": "boolean"
},
"depth": {
"default": 0,
"description": "Crawl depth",
"type": "integer"
},
"every": {
"anyOf": [
{
"type": "string"
},
{
"type": "null"
}
],
"default": null,
"description": "Schedule frequency (e.g., 'daily')"
},
"extra_data": {
"anyOf": [
{
"additionalProperties": true,
"type": "object"
},
{
"type": "null"
}
],
"default": null,
"description": "Additional parameters as a dictionary"
},
"import_path": {
"anyOf": [
{
"type": "string"
},
{
"type": "null"
}
],
"default": null,
"description": "Path to import file"
},
"overwrite": {
"default": false,
"description": "Overwrite existing files",
"type": "boolean"
},
"tag": {
"default": "",
"description": "Comma-separated tags",
"type": "string"
},
"update": {
"default": false,
"description": "Update existing snapshots",
"type": "boolean"
}
},
"type": "object"
}