mirror of
https://github.com/bellingcat/auto-archiver.git
synced 2026-06-11 12:48:28 +03:00
34 lines
1.2 KiB
Python
34 lines
1.2 KiB
Python
# Manifest for the "CSV Feeder" module, written as a single Python dict literal.
# It relies on True/None and a triple-quoted string, so it is Python, not JSON.
{
    "name": "CSV Feeder",
    "type": ["feeder"],
    # NOTE(review): "bin" holds one empty string rather than being an empty
    # list; left unchanged here -- confirm the consumer ignores blank entries.
    "dependencies": {"python": ["loguru"], "bin": [""]},
    "requires_setup": True,
    "entry_point": "csv_feeder::CSVFeeder",
    "configs": {
        "files": {
            "default": None,
            # Adjacent string literals are joined at compile time. This avoids
            # a backslash continuation inside the literal, where indentation
            # of the continued line would leak into the help text.
            "help": (
                "Path to the input file(s) to read the URLs from, comma separated. "
                "Input files should be formatted with one URL per line"
            ),
            "required": True,
            "type": "valid_file",
            "nargs": "+",
        },
        "column": {
            "default": None,
            "help": "Column number or name to read the URLs from, 0-indexed",
        },
    },
    # Markdown body is written flush-left so that no source indentation
    # becomes part of the string.
    "description": """
Reads URLs from CSV files and feeds them into the archiving process.

### Features
- Supports reading URLs from multiple input files, specified as a comma-separated list.
- Allows specifying the column number or name to extract URLs from.
- Skips header rows if the first value is not a valid URL.

### Setup
- Input files should be formatted with one URL per line, with or without a header row.
- If you have a header row, you can specify the column number or name to read URLs from using the 'column' config option.
""",
}