Permalink
Browse files

archives: add arquivo.pt support, remove hardcoded exclusion

  • Loading branch information...
1 parent a6bd94d commit 8f1370c2ff91ae37c209a2782ff070e0469837f1 @ikreymer ikreymer committed Jun 29, 2016
Showing with 16 additions and 5 deletions.
  1. +5 −1 app/templates/archives-list.html
  2. +7 −0 archives.yaml
  3. +4 −4 pywb/mementoquery.py
@@ -7,10 +7,14 @@
<a target="_blank" href="https://archive.org/web/">Internet Archive</a>
</li>
+ <li data-id="pwa">
+ <a target="_blank" href="http://arquivo.pt/">Portuguese Web Archive</a>
+ </li>
+
<li data-id="ba">
<a target="_blank" href="http://www.bibalex.org/isis/frontend/archive/archive_web.aspx">Bibliotheca Alexandrina Web Archive</a>
</li>
-
+
<li data-id="blarchive">
<a target="_blank" href="http://www.webarchive.org.uk/ukwa/">UK Web Archive</a>
</li>
View
@@ -11,6 +11,12 @@
timemap: http://web.archive.org/web/timemap/link/
link: https://archive.org/web/
+- id: pwa
+ name: Portuguese Web Archive
+ timegate: http://arquivo.pt/wayback/
+ timemap: http://arquivo.pt/wayback/timemap/*/
+ link: http://arquivo.pt/
+
- id: ba
name: Bibliotheca Alexandrina Web Archive
timegate: http://web.archive.bibalex.org/web/
@@ -49,6 +55,7 @@
timemap: https://swap.stanford.edu/timemap/link/
link: https://swap.stanford.edu/
+
# LANL Proxy
- id: es
name: Estonian Web Archive
@@ -19,7 +19,7 @@
from redisclient import redisclient
-EXCLUDE_LIST = ('http://archive.today/', 'http://archive.is', 'https://archive.today/', 'https://archive.is/', 'http://arquivo.pt')
+EXCLUDE_LIST = ('http://archive.today/', 'http://archive.is', 'https://archive.today/', 'https://archive.is/')
#=============================================================================
@@ -259,15 +259,15 @@ def sort_archives(self, archive_list):
else:
yield url
+ if pt:
+ yield pt
+
if ait:
yield ait
if ia:
yield ia
- if pt:
- yield pt
-
def memento_to_cdx(self, url, mem_iter, limit, skip_exclude=True):
key = canonicalize(url)
if url.endswith('/'):

0 comments on commit 8f1370c

Please sign in to comment.