[App] ArchiveBox (#2393)
* [App] ArchiveBox * Update apps/archivebox/metadata/description.md Co-authored-by: coderabbitai[bot] <136622811+coderabbitai[bot]@users.noreply.github.com> * feat(docker=compose): add more env vars for app and their default value --------- Co-authored-by: coderabbitai[bot] <136622811+coderabbitai[bot]@users.noreply.github.com> Co-authored-by: JigSawFr <JigSawFr@users.noreply.github.com>
This commit is contained in:
parent
7bc2fc14a8
commit
c407343e46
35
apps/archivebox/config.json
Executable file
35
apps/archivebox/config.json
Executable file
|
@ -0,0 +1,35 @@
|
|||
{
|
||||
"$schema": "../schema.json",
|
||||
"name": "ArchiveBox",
|
||||
"available": true,
|
||||
"exposable": true,
|
||||
"port": 8015,
|
||||
"id": "archivebox",
|
||||
"tipi_version": 1,
|
||||
"version": "0.7.3",
|
||||
"categories": ["media"],
|
||||
"description": "ArchiveBox is a powerful, self-hosted internet archiving solution to collect, save, and view websites offline.",
|
||||
"short_desc": "Open source self-hosted web archiving.",
|
||||
"author": "archivebox",
|
||||
"source": "https://github.com/ArchiveBox/ArchiveBox",
|
||||
"website": "https://archivebox.io",
|
||||
"form_fields": [
|
||||
{
|
||||
"type": "text",
|
||||
"label": "ArchiveBox Username",
|
||||
"max": 50,
|
||||
"min": 3,
|
||||
"required": true,
|
||||
"env_variable": "ARCHIVEBOX_USERNAME"
|
||||
},
|
||||
{
|
||||
"type": "password",
|
||||
"label": "ArchiveBox Password",
|
||||
"max": 50,
|
||||
"min": 12,
|
||||
"required": true,
|
||||
"env_variable": "ARCHIVEBOX_PASSWORD"
|
||||
}
|
||||
],
|
||||
"supported_architectures": ["arm64", "amd64"]
|
||||
}
|
54
apps/archivebox/docker-compose.yml
Executable file
54
apps/archivebox/docker-compose.yml
Executable file
|
@ -0,0 +1,54 @@
|
|||
services:
|
||||
archivebox:
|
||||
image: archivebox/archivebox:0.7.3
|
||||
restart: unless-stopped
|
||||
container_name: archivebox
|
||||
command: server --quick-init 0.0.0.0:8015
|
||||
environment:
|
||||
- PORT=8015
|
||||
- PUBLIC_INDEX=${ARCHIVEBOX_PUBLIC_INDEX-true} # set to False to prevent anonymous users from viewing snapshot list
|
||||
- PUBLIC_SNAPSHOTS=${ARCHIVEBOX_PUBLIC_SNAPSHOTS-true} # set to False to prevent anonymous users from viewing snapshot content
|
||||
- PUBLIC_ADD_VIEW=${ARCHIVEBOX_PUBLIC_ADD_VIEW-false} # set to True to allow anonymous users to submit new URLs to archive
|
||||
- ADMIN_USERNAME=${ARCHIVEBOX_USERNAME} # create an admin user on first run with the given user/pass combo
|
||||
- ADMIN_PASSWORD=${ARCHIVEBOX_PASSWORD}
|
||||
- PUID=1000 # set to your host user's UID & GID if you encounter permissions issues
|
||||
- PGID=1000
|
||||
- SEARCH_BACKEND_ENGINE=${ARCHIVEBOX_SEARCH_BACKEND_ENGINE} # uncomment these and sonic container below for better full-text search
|
||||
- SEARCH_BACKEND_HOST_NAME=${ARCHIVEBOX_SEARCH_BACKEND_HOST_NAME}
|
||||
- SEARCH_BACKEND_PASSWORD=${ARCHIVEBOX_SEARCH_BACKEND_PASSWORD}
|
||||
- MEDIA_MAX_SIZE=${ARCHIVEBOX_MEDIA_MAX_SIZE-750m} # increase this filesize limit to allow archiving larger audio/video files
|
||||
- TIMEOUT=${ARCHIVEBOX_TIMEOUT-60} # increase this number to 120+ seconds if you see many slow downloads timing out
|
||||
- CHECK_SSL_VALIDITY=${ARCHIVEBOX_CHECK_SSL_VALIDITY-true} # set to False to disable strict SSL checking (allows saving URLs w/ broken certs)
|
||||
- SAVE_ARCHIVE_DOT_ORG=${ARCHIVEBOX_SAVE_ARCHIVE_DOT_ORGE-true} # set to False to disable submitting all URLs to Archive.org when archiving
|
||||
networks:
|
||||
- tipi_main_network
|
||||
ports:
|
||||
- "${APP_PORT}:8015"
|
||||
volumes:
|
||||
- "${APP_DATA_DIR}/data:/data"
|
||||
- "${APP_DATA_DIR}/crontabs:/var/spool/cron/crontabs"
|
||||
labels:
|
||||
# Main
|
||||
traefik.enable: true
|
||||
traefik.http.middlewares.archivebox-web-redirect.redirectscheme.scheme: https
|
||||
traefik.http.services.archivebox.loadbalancer.server.port: 8015
|
||||
# Web
|
||||
traefik.http.routers.archivebox-insecure.rule: Host(`${APP_DOMAIN}`)
|
||||
traefik.http.routers.archivebox-insecure.entrypoints: web
|
||||
traefik.http.routers.archivebox-insecure.service: archivebox
|
||||
traefik.http.routers.archivebox-insecure.middlewares: archivebox-web-redirect
|
||||
# Websecure
|
||||
traefik.http.routers.archivebox.rule: Host(`${APP_DOMAIN}`)
|
||||
traefik.http.routers.archivebox.entrypoints: websecure
|
||||
traefik.http.routers.archivebox.service: archivebox
|
||||
traefik.http.routers.archivebox.tls.certresolver: myresolver
|
||||
# Local domain
|
||||
traefik.http.routers.archivebox-local-insecure.rule: Host(`archivebox.${LOCAL_DOMAIN}`)
|
||||
traefik.http.routers.archivebox-local-insecure.entrypoints: web
|
||||
traefik.http.routers.archivebox-local-insecure.service: archivebox
|
||||
traefik.http.routers.archivebox-local-insecure.middlewares: archivebox-web-redirect
|
||||
# Local domain secure
|
||||
traefik.http.routers.archivebox-local.rule: Host(`archivebox.${LOCAL_DOMAIN}`)
|
||||
traefik.http.routers.archivebox-local.entrypoints: websecure
|
||||
traefik.http.routers.archivebox-local.service: archivebox
|
||||
traefik.http.routers.archivebox-local.tls: true
|
24
apps/archivebox/metadata/description.md
Executable file
24
apps/archivebox/metadata/description.md
Executable file
|
@ -0,0 +1,24 @@
|
|||
# ArchiveBox
|
||||
|
||||
ArchiveBox is a powerful, self-hosted internet archiving solution to collect, save, and view websites offline.
|
||||
|
||||
---
|
||||
|
||||
![](https://github.com/ArchiveBox/ArchiveBox/assets/511499/90f1ce3c-75bb-401d-88ed-6297694b76ae?raw=true)
|
||||
|
||||
---
|
||||
|
||||
Without active preservation effort, everything on the internet eventually disappears or degrades. Archive.org does a great job as a centralized service, but saved URLs have to be public, and they can't save every type of content.
|
||||
|
||||
ArchiveBox is an open source tool that lets organizations & individuals archive both public & private web content while retaining control over their data. It can be used to save copies of bookmarks, preserve evidence for legal cases, backup photos from FB/Insta/Flickr or media from YT/Soundcloud/etc., save research papers, and more...
|
||||
|
||||
📥 **You can feed ArchiveBox URLs one at a time, or schedule regular imports** from your bookmarks or history, social media feeds or RSS, link-saving services like Pocket/Pinboard, our [Browser Extension](https://chromewebstore.google.com/detail/archivebox-exporter/habonpimjphpdnmcfkaockjnffodikoj), and more.
|
||||
|
||||
**It saves snapshots of the URLs you feed it in several redundant formats.**
|
||||
It also detects any content featured *inside* pages & extracts it out into a folder:
|
||||
|
||||
- 🌐 **HTML**/**Any websites** ➡️ `original HTML+CSS+JS`, `singlefile HTML`, `screenshot PNG`, `PDF`, `WARC`, `title`, `article text`, `favicon`, `headers`, ...
|
||||
- 🎥 **Social Media**/**News** ➡️ `post content TXT`, `comments`, `title`, `author`, `images`, ...
|
||||
- 🎬 **YouTube**/**SoundCloud**/etc. ➡️ `MP3/MP4`s, `subtitles`, `metadata`, `thumbnail`, ...
|
||||
- 💾 **Github**/**Gitlab**/etc. links ➡️ `clone of GIT source code`, `README`, `images`, ...
|
||||
- ✨ *and more ...
|
BIN
apps/archivebox/metadata/logo.jpg
Executable file
BIN
apps/archivebox/metadata/logo.jpg
Executable file
Binary file not shown.
After Width: | Height: | Size: 17 KiB |
Loading…
Reference in New Issue
Block a user