# Steps: the components selected for each stage (feeder, archivers,
# formatters, storages, databases). Entries commented out are disabled.
steps:
  # Only one feeder is allowed.
  # A feeder could run in an "infinite loop" (for example, a gsheets_infinite
  # feeder that holds). If that becomes necessary, it would be an easy logic
  # addition: change the `for each` into `while not feeder.done()`.
  feeder: gsheet_feeder  # default -> only expects URL from CLI
  archivers:  # order matters
    - telethon
    # - tiktok
    # - twitter
    # - instagram
    # - webarchive  # this way it runs as a failsafe only
  # enrichers:
  #   - screenshot
  #   - wacz
  #   - webarchive  # this way it runs for every case, webarchive extends archiver and enrichment
  #   - thumbnails
  formatters:
    - HTMLFormater
    - PdfFormater
  storages:
    - local_storage
    - s3
  databases:
    - gsheets_db
    - mongo_db
# Settings for individual components; several section names below
# (gsheet_feeder, telethon, s3) match names listed under `steps`.
# Credential-looking values in this file appear to be placeholders.
configurations:
  global:
    # NOTE(review): this is a one-item list of mappings, while most other
    # sections are plain mappings -- confirm the loader expects a list here.
    - save_logs: false
  gsheet_feeder:
    sheet: my-auto-archiver
    header: 2  # defaults to 1 in GSheetsFeeder
    service_account: "secrets/service_account.json"
    # allow_worksheets: "allowed"
    # block_worksheets: "blocked1,blocked2"
    # Presumably maps internal field names to the column header text used in
    # the sheet -- TODO confirm against the feeder.
    columns:
      url: 'link'
      status: 'archive status'
      folder: 'destination folder'
      archive: 'archive location'
      date: 'archive date'
      thumbnail: 'thumbnail'
      thumbnail_index: 'thumbnail index'
      timestamp: 'upload timestamp'
      title: 'upload title'
      duration: 'duration'
      screenshot: 'screenshot'
      hash: 'hash'
      wacz: 'wacz'
      replaywebpage: 'replaywebpage'
  telethon:
    api_id: "1234567"
    api_hash: "examplehash"
    session_file: "secrets/anon"
    # Each entry pairs an invite link with a numeric id.
    channel_invites:
      - invite: https://t.me/+XXXXXXXXXXXXXX
        id: 1000000000
      - invite: https://t.me/joinchat/XXXXXXXXXXXXXX
        id: 1000000001
  tiktok:
    # NOTE(review): the unquoted values below parse as integers, not strings;
    # quote real usernames/passwords if the consumer expects strings.
    api_keys:
      - username: 1
        password: 2
      - username: 3
        password: 4
    username: "abc"
    password: "123"
    token: "here"
  screenshot:
    width: 1280
    height: 4600
  wacz:
    profile: secrets/profile.tar.gz
  webarchive:
    api_key: "12345"
  s3:
    # NOTE(review): written as a list of single-key mappings rather than one
    # mapping, and `bucket: 123` parses as an integer. Confirm both are what
    # the storage component expects before relying on this section.
    - bucket: 123
    - region: "nyc3"
    - cdn: "{region}{bucket}"