ArchiveBox/archivebox/core/views.py

138 lines
4.2 KiB
Python
Raw Normal View History

__package__ = 'archivebox.core'
2019-04-02 20:36:41 +00:00
from django.shortcuts import render, redirect
2019-04-17 09:42:21 +00:00
from django.http import HttpResponse
from django.views import View, static
2019-05-01 03:44:51 +00:00
from core.models import Snapshot
from contextlib import redirect_stdout
from io import StringIO
from ..index import load_main_index, load_main_index_meta
from ..config import (
OUTPUT_DIR,
VERSION,
FOOTER_INFO,
PUBLIC_INDEX,
PUBLIC_SNAPSHOTS,
)
from ..util import base_url, ansi_to_html
2020-03-27 12:37:31 +00:00
from .. main import add
from .forms import AddLinkForm
2019-04-17 09:42:21 +00:00
class MainIndex(View):
    """Render the main index page listing every link in the archive."""

    template = 'main_index.html'

    def get(self, request):
        """Return the rendered index, or a login redirect for anonymous users.

        Anonymous requests are only served when ``PUBLIC_INDEX`` is truthy;
        otherwise they are sent to the admin login page with ``next`` set to
        the requested path.
        """
        may_view = request.user.is_authenticated or PUBLIC_INDEX
        if not may_view:
            return redirect(f'/admin/login/?next={request.path}')

        # Load the link list first, then the index metadata, both from OUTPUT_DIR.
        links = load_main_index(out_dir=OUTPUT_DIR)
        meta = load_main_index_meta(out_dir=OUTPUT_DIR)

        page_context = dict(
            updated=meta['updated'],
            num_links=meta['num_links'],
            links=links,
            VERSION=VERSION,
            FOOTER_INFO=FOOTER_INFO,
        )
        return render(request, self.template, page_context)
class AddLinks(View):
    """Form page for submitting a new URL to be archived.

    ``GET`` renders an empty ``AddLinkForm``. ``POST`` validates the submitted
    form, runs ``add()`` on the URL while capturing everything it prints, and
    re-renders the page with that output converted to HTML.
    """

    template = 'add_links.html'

    def get(self, request):
        """Render the blank form, or redirect anonymous users to the login page.

        Anonymous requests are only served when ``PUBLIC_INDEX`` is truthy.
        """
        if not request.user.is_authenticated and not PUBLIC_INDEX:
            return redirect(f'/admin/login/?next={request.path}')

        context = {
            "form": AddLinkForm()
        }
        return render(template_name=self.template, request=request, context=context)

    def post(self, request):
        """Archive the submitted URL and render the captured output.

        On a valid form the page is rendered with ``stdout`` (the HTML-converted
        output of ``add()``) and a fresh empty form. On an invalid form the
        bound form is rendered again so its validation errors can be shown.
        """
        if not request.user.is_authenticated and not PUBLIC_INDEX:
            return redirect(f'/admin/login/?next={request.path}')

        form = AddLinkForm(request.POST)
        if form.is_valid():
            url = form.cleaned_data["url"]
            print(f'[+] Adding URL: {url}')

            # The form delivers depth as a string. Previously both branches of
            # this expression evaluated to 0, so the user's depth choice was
            # silently ignored; any value other than "0" now selects depth 1.
            # NOTE(review): assumes AddLinkForm only offers "0" and "1" and
            # that add() accepts depth=1 -- confirm against forms.py / main.py.
            depth = 0 if form.cleaned_data["depth"] == "0" else 1

            input_kwargs = {
                "urls": url,
                "depth": depth,
                "update_all": False,
                "out_dir": OUTPUT_DIR,
            }

            # Capture everything add() prints so it can be shown in the page.
            add_stdout = StringIO()
            with redirect_stdout(add_stdout):
                add(**input_kwargs)

            # Echo the captured output to the real stdout as well.
            print(add_stdout.getvalue())

            context = {
                "stdout": ansi_to_html(add_stdout.getvalue()),
                "form": AddLinkForm()
            }
        else:
            context = {"form": form}

        return render(template_name=self.template, request=request, context=context)
2019-04-17 09:42:21 +00:00
class LinkDetails(View):
    """Serve a file from a snapshot's directory, or redirect to where it lives.

    The first segment of ``path`` (the slug) is tried, in order, as a snapshot
    timestamp and then as a URL hash; finally the whole ``path`` is tried as a
    URL via ``base_url()``. The first match wins.
    """

    def get(self, request, path):
        """Resolve ``path`` to a snapshot and respond accordingly.

        Returns:
            - a redirect to ``{path}/index.html`` when ``path`` has no slash;
            - a redirect to the admin login for anonymous users unless
              ``PUBLIC_SNAPSHOTS`` is truthy;
            - the static file response (with a canonical ``Link`` header) when
              the slug is a known timestamp;
            - a redirect to ``/archive/<timestamp>/...`` when the slug is a
              known hash or the path is a known URL;
            - a plain-text 404 response when nothing matches.
        """
        # missing trailing slash -> redirect to index
        if '/' not in path:
            return redirect(f'{path}/index.html')

        if not request.user.is_authenticated and not PUBLIC_SNAPSHOTS:
            return redirect(f'/admin/login/?next={request.path}')

        # The guard above guarantees a '/' is present, so this split always
        # yields exactly two parts and needs no fallback handling.
        slug, archivefile = path.split('/', 1)

        all_pages = list(Snapshot.objects.all())

        # Each lookup table is only built if the previous lookup missed.
        # dict.get() is used so that only a missing key counts as "no match";
        # errors raised while building the response are not swallowed.

        # slug is a timestamp
        by_ts = {page.timestamp: page for page in all_pages}
        snapshot = by_ts.get(slug)
        if snapshot is not None:
            response = static.serve(
                request,
                archivefile,
                document_root=snapshot.link_dir,
                show_indexes=True,
            )
            response["Link"] = f'<{snapshot.url}>; rel="canonical"'
            return response

        # slug is a hash
        by_hash = {page.url_hash: page for page in all_pages}
        snapshot = by_hash.get(slug)
        if snapshot is not None:
            timestamp = snapshot.timestamp
            return redirect(f'/archive/{timestamp}/{archivefile}')

        # slug is a URL
        by_url = {page.base_url: page for page in all_pages}
        # TODO: add multiple snapshot support by showing index of all snapshots
        #       for given url instead of redirecting to timestamp index
        snapshot = by_url.get(base_url(path))
        if snapshot is not None:
            timestamp = snapshot.timestamp
            return redirect(f'/archive/{timestamp}/index.html')

        return HttpResponse(
            'No archived link matches the given timestamp or hash.',
            content_type="text/plain",
            status=404,
        )