# example.config.yaml
#
# Example configuration: credentials live under `secrets`, run options under
# `execution`. The values below are placeholders to be replaced with your own.
---
secrets:
  # needed if you use storage=s3
  s3:
    # contains S3 info on region, bucket, key and secret
    region: reg1
    bucket: my-bucket
    key: "s3 API key"
    secret: "s3 API secret"
    # use the {region} placeholder like so
    endpoint_url: "https://{region}.digitaloceanspaces.com"
    # use the {bucket}, {region} and {key} placeholders like so
    # ({key} is the archived file path generated when executing)
    cdn_url: "https://{bucket}.{region}.cdn.digitaloceanspaces.com/{key}"
    # if private is true, S3 URLs will not be readable online
    private: false
    # with 'random' you can generate a random UUID for the URL instead of a
    # predictable path, useful to still have public but unlisted files;
    # the alternative is 'default', or omit key_path from the config
    key_path: random

  # needed if you use storage=gd
  google_drive:
    # local filename, can be the same file as google_sheets.service_account
    # or a different one, defaults to service_account.json
    service_account: "service_account.json"
    root_folder_id: copy XXXX from https://drive.google.com/drive/folders/XXXX

  # needed if you use storage=local
  local:
    # local path to save files in
    save_to: "./local_archive"

  wayback:
    # to get credentials visit https://archive.org/account/s3.php
    key: your API key
    secret: your API secret

  telegram:
    # to get credentials see:
    # https://telegra.ph/How-to-get-Telegram-APP-ID--API-HASH-05-27
    api_id: your API key, see
    api_hash: your API hash
    # optional, but allows access to more content such as large videos,
    # talk to @botfather
    bot_token: your bot-token

  # twitter configuration - API V2 only
  # if you don't provide credentials the less-effective unofficial
  # TwitterArchiver will be used instead
  twitter:
    # either bearer_token only
    bearer_token: ""
    # OR all of the below
    consumer_key: ""
    consumer_secret: ""
    access_token: ""
    access_secret: ""

  # vkontakte (vk.com) credentials
  vk:
    username: "phone number or email"
    password: "password"

  google_sheets:
    # local filename: defaults to service_account.json, see
    # https://gspread.readthedocs.io/en/latest/oauth2.html#for-bots-using-service-account
    service_account: "service_account.json"

  facebook:
    # optional facebook cookie to have more access to content, taken from the
    # browser, looks like 'cookie: datr= xxxx'
    cookie: ""

execution:
  # can be overwritten with CMD --sheet=
  sheet: your-sheet-name
  # which row of your tabs contains the header,
  # can be overwritten with CMD --header=
  header: 1
  # which storage to use, can be overwritten with CMD --storage=
  storage: s3
  # defaults to false, when true will try to avoid duplicate URL archives
  check_if_exists: true

  # optional configurations for the selenium browser that takes screenshots,
  # these are the defaults
  selenium:
    # values under 10s might cause screenshots to fail
    timeout_seconds: 120
    window_width: 1400
    window_height: 2000

  # puts execution logs into /logs folder, defaults to false
  save_logs: true

  # custom column names, only needed if different from default,
  # can be overwritten with CMD --col-NAME="VALUE"
  # url and status are the only columns required to be present in the
  # google sheet
  column_names:
    url: link
    status: archive status
    archive: archive location
    # use this column to override default location data
    folder: folder
    date: archive date
    thumbnail: thumbnail
    thumbnail_index: thumbnail index
    timestamp: upload timestamp
    title: upload title
    duration: duration
    screenshot: screenshot
    hash: hash