Item archiveteam_archivebot_go_20171101170001

View on Internet Archive

Filename Size
addons.mozilla.org-inf-20170829-025732-4aa66-00215.warc.gz 5376060854 download   job
addons.mozilla.org-inf-20170829-025732-4aa66-00215.warc.os.cdx.gz 4937588 download
addons.mozilla.org-inf-20170829-025732-4aa66-00216.warc.gz 5379802225 download   job
addons.mozilla.org-inf-20170829-025732-4aa66-00216.warc.os.cdx.gz 3122177 download
addons.mozilla.org-inf-20170829-025732-4aa66-00217.warc.gz 5368771421 download   job
addons.mozilla.org-inf-20170829-025732-4aa66-00217.warc.os.cdx.gz 2664527 download
analisiocupaciopublica.gencat.cat-inf-20171101-053839-irfuy-00000.warc.gz 15448420 download   job
analisiocupaciopublica.gencat.cat-inf-20171101-053839-irfuy-00000.warc.os.cdx.gz 50805 download
analisiocupaciopublica.gencat.cat-inf-20171101-053839-irfuy-meta.warc.gz 33490 download   job
analisiocupaciopublica.gencat.cat-inf-20171101-053839-irfuy-meta.warc.os.cdx.gz 47 download
analisiocupaciopublica.gencat.cat-inf-20171101-053839-irfuy.json 263 download   job
aplicacions.aca.gencat.cat-inf-20171101-053044-luucw-00000.warc.gz 10397140 download   job
aplicacions.aca.gencat.cat-inf-20171101-053044-luucw-00000.warc.os.cdx.gz 44687 download
aplicacions.aca.gencat.cat-inf-20171101-053044-luucw-meta.warc.gz 29449 download   job
aplicacions.aca.gencat.cat-inf-20171101-053044-luucw-meta.warc.os.cdx.gz 47 download
aplicacions.aca.gencat.cat-inf-20171101-053044-luucw.json 257 download   job
apnews.com-shallow-20171031-223635-9w9fm-00000.warc.gz 3391328 download   job
apnews.com-shallow-20171031-223635-9w9fm-00000.warc.os.cdx.gz 15962 download
apnews.com-shallow-20171031-223635-9w9fm-meta.warc.gz 12478 download   job
apnews.com-shallow-20171031-223635-9w9fm-meta.warc.os.cdx.gz 47 download
apnews.com-shallow-20171031-223635-9w9fm.json 335 download   job
archiveteam_archivebot_go_20171101170001.cdx.gz 129880595 download
archiveteam_archivebot_go_20171101170001.cdx.idx 138576 download
archiveteam_archivebot_go_20171101170001_archive.torrent 861508 download
archiveteam_archivebot_go_20171101170001_files.xml 0 download
archiveteam_archivebot_go_20171101170001_meta.sqlite 291840 download
archiveteam_archivebot_go_20171101170001_meta.xml 1009 download
bibliotecadigital.fgv.br-shallow-20171101-140122-cjjaj-00000.warc.gz 894758 download   job
bibliotecadigital.fgv.br-shallow-20171101-140122-cjjaj-00000.warc.os.cdx.gz 259 download
bibliotecadigital.fgv.br-shallow-20171101-140122-cjjaj-meta.warc.gz 3558 download   job
bibliotecadigital.fgv.br-shallow-20171101-140122-cjjaj-meta.warc.os.cdx.gz 47 download
bibliotecadigital.fgv.br-shallow-20171101-140122-cjjaj.json 302 download   job
blog.architecting.it-shallow-20171101-152847-5bmvd-00000.warc.gz 2312849 download   job
blog.architecting.it-shallow-20171101-152847-5bmvd-00000.warc.os.cdx.gz 6412 download
blog.architecting.it-shallow-20171101-152847-5bmvd-meta.warc.gz 7278 download   job
blog.architecting.it-shallow-20171101-152847-5bmvd-meta.warc.os.cdx.gz 47 download
blog.architecting.it-shallow-20171101-152847-5bmvd.json 266 download   job
blog.ircmaxell.com-shallow-20171101-135537-eyaow-00000.warc.gz 441642 download   job
blog.ircmaxell.com-shallow-20171101-135537-eyaow-00000.warc.os.cdx.gz 3071 download
blog.ircmaxell.com-shallow-20171101-135537-eyaow-meta.warc.gz 5406 download   job
blog.ircmaxell.com-shallow-20171101-135537-eyaow-meta.warc.os.cdx.gz 47 download
blog.ircmaxell.com-shallow-20171101-135537-eyaow.json 315 download   job
consumerist.com-inf-20171030-235804-4xyuq-00002.warc.gz 5368716489 download   job
consumerist.com-inf-20171030-235804-4xyuq-00002.warc.os.cdx.gz 5544116 download
consumerist.com-inf-20171030-235804-4xyuq-00003.warc.gz 5368756227 download   job
consumerist.com-inf-20171030-235804-4xyuq-00003.warc.os.cdx.gz 4923491 download
consumerist.com-inf-20171030-235804-4xyuq-00004.warc.gz 5368994727 download   job
consumerist.com-inf-20171030-235804-4xyuq-00004.warc.os.cdx.gz 4320916 download
consumerist.com-inf-20171030-235804-4xyuq-00005.warc.gz 5392429764 download   job
consumerist.com-inf-20171030-235804-4xyuq-00005.warc.os.cdx.gz 3781968 download
consumerist.com-inf-20171030-235804-4xyuq-00006.warc.gz 5368844382 download   job
consumerist.com-inf-20171030-235804-4xyuq-00006.warc.os.cdx.gz 344758 download
download.unirc.eu-inf-20171030-225936-5to3m-00002.warc.gz 5499672133 download   job
download.unirc.eu-inf-20171030-225936-5to3m-00002.warc.os.cdx.gz 15789 download
download.unirc.eu-inf-20171030-225936-5to3m-00003.warc.gz 5863731019 download   job
download.unirc.eu-inf-20171030-225936-5to3m-00003.warc.os.cdx.gz 59765 download
dps.gencat.cat-inf-20171101-053459-9m46j-00000.warc.gz 7361 download   job
dps.gencat.cat-inf-20171101-053459-9m46j-00000.warc.os.cdx.gz 261 download
dps.gencat.cat-inf-20171101-053459-9m46j-meta.warc.gz 3509 download   job
dps.gencat.cat-inf-20171101-053459-9m46j-meta.warc.os.cdx.gz 47 download
dps.gencat.cat-inf-20171101-053459-9m46j.json 245 download   job
maklerejo.de-inf-20171101-152746-7pj2l-00000.warc.gz 74760 download   job
maklerejo.de-inf-20171101-152746-7pj2l-00000.warc.os.cdx.gz 349 download
maklerejo.de-inf-20171101-152746-7pj2l-meta.warc.gz 3552 download   job
maklerejo.de-inf-20171101-152746-7pj2l-meta.warc.os.cdx.gz 47 download
maklerejo.de-inf-20171101-152746-7pj2l.json 242 download   job
matthew.house-inf-20171101-151058-8i4hs-00000.warc.gz 90638779 download   job
matthew.house-inf-20171101-151058-8i4hs-00000.warc.os.cdx.gz 175958 download
matthew.house-inf-20171101-151058-8i4hs-meta.warc.gz 141554 download   job
matthew.house-inf-20171101-151058-8i4hs-meta.warc.os.cdx.gz 47 download
matthew.house-inf-20171101-151058-8i4hs.json 243 download   job
mediatormatthew.com-inf-20171101-152446-er1up-00000.warc.gz 20098532 download   job
mediatormatthew.com-inf-20171101-152446-er1up-00000.warc.os.cdx.gz 36389 download
mediatormatthew.com-inf-20171101-152446-er1up-meta.warc.gz 25930 download   job
mediatormatthew.com-inf-20171101-152446-er1up-meta.warc.os.cdx.gz 47 download
mediatormatthew.com-inf-20171101-152446-er1up.json 249 download   job
noticias.uol.com.br-shallow-20171101-125657-cfmx9-00000.warc.gz 44736 download   job
noticias.uol.com.br-shallow-20171101-125657-cfmx9-00000.warc.os.cdx.gz 1166 download
noticias.uol.com.br-shallow-20171101-125657-cfmx9-meta.warc.gz 4297 download   job
noticias.uol.com.br-shallow-20171101-125657-cfmx9-meta.warc.os.cdx.gz 47 download
noticias.uol.com.br-shallow-20171101-125657-cfmx9.json 286 download   job
pirata.cat-inf-20171101-054244-d2f5a-00000.warc.gz 5370932280 download   job
pirata.cat-inf-20171101-054244-d2f5a-00000.warc.os.cdx.gz 3412559 download
pirata.cat-inf-20171101-054244-d2f5a-00001.warc.gz 624366253 download   job
pirata.cat-inf-20171101-054244-d2f5a-00001.warc.os.cdx.gz 721814 download
pirata.cat-inf-20171101-054244-d2f5a-meta.warc.gz 2636745 download   job
pirata.cat-inf-20171101-054244-d2f5a-meta.warc.os.cdx.gz 47 download
pirata.cat-inf-20171101-054244-d2f5a.json 240 download   job
preproduccio.aplicacions.aca.gencat.cat-inf-20171101-053510-bzxxp-00000.warc.gz 10941737 download   job
preproduccio.aplicacions.aca.gencat.cat-inf-20171101-053510-bzxxp-00000.warc.os.cdx.gz 44664 download
preproduccio.aplicacions.aca.gencat.cat-inf-20171101-053510-bzxxp-meta.warc.gz 29341 download   job
preproduccio.aplicacions.aca.gencat.cat-inf-20171101-053510-bzxxp-meta.warc.os.cdx.gz 47 download
preproduccio.aplicacions.aca.gencat.cat-inf-20171101-053510-bzxxp.json 270 download   job
s.zeptobars.com-shallow-20171101-064805-36txo-00000.warc.gz 302629737 download   job
s.zeptobars.com-shallow-20171101-064805-36txo-00000.warc.os.cdx.gz 243 download
s.zeptobars.com-shallow-20171101-064805-36txo-meta.warc.gz 3529 download   job
s.zeptobars.com-shallow-20171101-064805-36txo-meta.warc.os.cdx.gz 47 download
s.zeptobars.com-shallow-20171101-064805-36txo.json 271 download   job
s.zeptobars.com-shallow-20171101-065822-4bn9j-00000.warc.gz 210154284 download   job
s.zeptobars.com-shallow-20171101-065822-4bn9j-00000.warc.os.cdx.gz 246 download
s.zeptobars.com-shallow-20171101-065822-4bn9j-meta.warc.gz 3525 download   job
s.zeptobars.com-shallow-20171101-065822-4bn9j-meta.warc.os.cdx.gz 47 download
s.zeptobars.com-shallow-20171101-065822-4bn9j.json 272 download   job
solarroadways.com-shallow-20171101-135204-8r832-00000.warc.gz 5541 download   job
solarroadways.com-shallow-20171101-135204-8r832-00000.warc.os.cdx.gz 209 download
solarroadways.com-shallow-20171101-135204-8r832-meta.warc.gz 3378 download   job
solarroadways.com-shallow-20171101-135204-8r832-meta.warc.os.cdx.gz 47 download
solarroadways.com-shallow-20171101-135204-8r832.json 245 download   job
twitter.com-inf-20171028-124956-ew8yg-00000.warc.gz 301462362 download   job
twitter.com-inf-20171028-124956-ew8yg-00000.warc.os.cdx.gz 426286 download
twitter.com-inf-20171028-124956-ew8yg.json 250 download   job
twitter.com-shallow-20171031-224350-d3je9-00000.warc.gz 983534 download   job
twitter.com-shallow-20171031-224350-d3je9-00000.warc.os.cdx.gz 4556 download
twitter.com-shallow-20171031-224350-d3je9-meta.warc.gz 6522 download   job
twitter.com-shallow-20171031-224350-d3je9-meta.warc.os.cdx.gz 47 download
twitter.com-shallow-20171031-224350-d3je9.json 267 download   job
twitter.com-shallow-20171031-230309-4p559-00000.warc.gz 1823920 download   job
twitter.com-shallow-20171031-230309-4p559-00000.warc.os.cdx.gz 4726 download
twitter.com-shallow-20171031-230309-4p559-meta.warc.gz 6571 download   job
twitter.com-shallow-20171031-230309-4p559-meta.warc.os.cdx.gz 47 download
twitter.com-shallow-20171031-230309-4p559.json 248 download   job
twitter.com-shallow-20171101-075417-cdaod-00000.warc.gz 2012183 download   job
twitter.com-shallow-20171101-075417-cdaod-00000.warc.os.cdx.gz 4902 download
twitter.com-shallow-20171101-075417-cdaod-meta.warc.gz 6660 download   job
twitter.com-shallow-20171101-075417-cdaod-meta.warc.os.cdx.gz 47 download
twitter.com-shallow-20171101-075417-cdaod.json 255 download   job
twitter.com-shallow-20171101-075449-68792-00000.warc.gz 1893489 download   job
twitter.com-shallow-20171101-075449-68792-00000.warc.os.cdx.gz 5411 download
twitter.com-shallow-20171101-075449-68792-meta.warc.gz 6982 download   job
twitter.com-shallow-20171101-075449-68792-meta.warc.os.cdx.gz 47 download
twitter.com-shallow-20171101-075449-68792.json 260 download   job
twitter.com-shallow-20171101-075540-86yif-00000.warc.gz 4583447 download   job
twitter.com-shallow-20171101-075540-86yif-00000.warc.os.cdx.gz 5940 download
twitter.com-shallow-20171101-075540-86yif-meta.warc.gz 7350 download   job
twitter.com-shallow-20171101-075540-86yif-meta.warc.os.cdx.gz 47 download
twitter.com-shallow-20171101-075540-86yif.json 259 download   job
twitter.com-shallow-20171101-075558-f4ii2-00000.warc.gz 2713510 download   job
twitter.com-shallow-20171101-075558-f4ii2-00000.warc.os.cdx.gz 5779 download
twitter.com-shallow-20171101-075558-f4ii2-meta.warc.gz 7258 download   job
twitter.com-shallow-20171101-075558-f4ii2-meta.warc.os.cdx.gz 47 download
twitter.com-shallow-20171101-075558-f4ii2.json 259 download   job
twitter.com-shallow-20171101-075616-48kpn-00000.warc.gz 3303617 download   job
twitter.com-shallow-20171101-075616-48kpn-00000.warc.os.cdx.gz 5855 download
twitter.com-shallow-20171101-075616-48kpn-meta.warc.gz 7316 download   job
twitter.com-shallow-20171101-075616-48kpn-meta.warc.os.cdx.gz 47 download
twitter.com-shallow-20171101-075616-48kpn.json 259 download   job
twitter.com-shallow-20171101-075632-7o3hq-00000.warc.gz 2318791 download   job
twitter.com-shallow-20171101-075632-7o3hq-00000.warc.os.cdx.gz 5835 download
twitter.com-shallow-20171101-075632-7o3hq-meta.warc.gz 7326 download   job
twitter.com-shallow-20171101-075632-7o3hq-meta.warc.os.cdx.gz 47 download
twitter.com-shallow-20171101-075632-7o3hq.json 259 download   job
urls-a.uguu.se-AfN4WZ5605VJ_nn.txt-shallow-20171031-104145-9hn4w-00001.warc.gz 5368837197 download   job
urls-a.uguu.se-AfN4WZ5605VJ_nn.txt-shallow-20171031-104145-9hn4w-00001.warc.os.cdx.gz 2837168 download
urls-a.uguu.se-AfN4WZ5605VJ_nn.txt-shallow-20171031-104145-9hn4w-00002.warc.gz 183452405 download   job
urls-a.uguu.se-AfN4WZ5605VJ_nn.txt-shallow-20171031-104145-9hn4w-00002.warc.os.cdx.gz 308552 download
urls-a.uguu.se-AfN4WZ5605VJ_nn.txt-shallow-20171031-104145-9hn4w-meta.warc.gz 6007598 download   job
urls-a.uguu.se-AfN4WZ5605VJ_nn.txt-shallow-20171031-104145-9hn4w-meta.warc.os.cdx.gz 47 download
urls-a.uguu.se-AfN4WZ5605VJ_nn.txt-shallow-20171031-104145-9hn4w-urls.txt 1650000 download
urls-a.uguu.se-AfN4WZ5605VJ_nn.txt-shallow-20171031-104145-9hn4w.json 294 download   job
urls-a.uguu.se-g4cbd6yaxUzb_nn.txt-shallow-20171031-190206-aph2c-00000.warc.gz 5380794050 download   job
urls-a.uguu.se-g4cbd6yaxUzb_nn.txt-shallow-20171031-190206-aph2c-00000.warc.os.cdx.gz 5140091 download
urls-a.uguu.se-g4cbd6yaxUzb_nn.txt-shallow-20171031-190206-aph2c-00001.warc.gz 5368954968 download   job
urls-a.uguu.se-g4cbd6yaxUzb_nn.txt-shallow-20171031-190206-aph2c-00001.warc.os.cdx.gz 3412041 download
urls-a.uguu.se-g4cbd6yaxUzb_nn.txt-shallow-20171031-190206-aph2c-00002.warc.gz 400963148 download   job
urls-a.uguu.se-g4cbd6yaxUzb_nn.txt-shallow-20171031-190206-aph2c-00002.warc.os.cdx.gz 421179 download
urls-a.uguu.se-g4cbd6yaxUzb_nn.txt-shallow-20171031-190206-aph2c-meta.warc.gz 5602136 download   job
urls-a.uguu.se-g4cbd6yaxUzb_nn.txt-shallow-20171031-190206-aph2c-meta.warc.os.cdx.gz 47 download
urls-a.uguu.se-g4cbd6yaxUzb_nn.txt-shallow-20171031-190206-aph2c-urls.txt 1650000 download
urls-a.uguu.se-g4cbd6yaxUzb_nn.txt-shallow-20171031-190206-aph2c.json 294 download   job
urls-a.uguu.se-zOmsoPby1SZM_nn.txt-shallow-20171101-163722-2l02x-aborted-00000.warc.gz 32731412 download   job
urls-a.uguu.se-zOmsoPby1SZM_nn.txt-shallow-20171101-163722-2l02x-aborted-00000.warc.os.cdx.gz 149703 download
urls-a.uguu.se-zOmsoPby1SZM_nn.txt-shallow-20171101-163722-2l02x-aborted.json 293 download   job
urls-a.uguu.se-zOmsoPby1SZM_nn.txt-shallow-20171101-163722-2l02x-urls.txt 1650000 download
urls-gist.github.com-slingshotesports.com-shallow-20171031-225927-dbb0x-00000.warc.gz 2054608008 download   job
urls-gist.github.com-slingshotesports.com-shallow-20171031-225927-dbb0x-00000.warc.os.cdx.gz 2618201 download
urls-gist.github.com-slingshotesports.com-shallow-20171031-225927-dbb0x-meta.warc.gz 1609338 download   job
urls-gist.github.com-slingshotesports.com-shallow-20171031-225927-dbb0x-meta.warc.os.cdx.gz 47 download
urls-gist.github.com-slingshotesports.com-shallow-20171031-225927-dbb0x-urls.txt 668813 download
urls-gist.github.com-slingshotesports.com-shallow-20171031-225927-dbb0x.json 482 download   job
urls-gist.githubusercontent.com-fcbarcelona-websites-inf-20171031-101030-d6okg-00000.warc.gz 5369953369 download   job
urls-gist.githubusercontent.com-fcbarcelona-websites-inf-20171031-101030-d6okg-00000.warc.os.cdx.gz 4493501 download
urls-gist.githubusercontent.com-fcbarcelona-websites-inf-20171031-101030-d6okg-00001.warc.gz 5369342746 download   job
urls-gist.githubusercontent.com-fcbarcelona-websites-inf-20171031-101030-d6okg-00001.warc.os.cdx.gz 4911351 download
urls-gist.githubusercontent.com-gistfile1.txt-inf-20171023-065909-er537-00013.warc.gz 5368709153 download   job
urls-gist.githubusercontent.com-gistfile1.txt-inf-20171023-065909-er537-00013.warc.os.cdx.gz 15484959 download
urls-gist.githubusercontent.com-gistfile1.txt-inf-20171023-065909-er537-00014.warc.gz 5443167031 download   job
urls-gist.githubusercontent.com-gistfile1.txt-inf-20171023-065909-er537-00014.warc.os.cdx.gz 2072637 download
urls-gist.githubusercontent.com-gistfile1.txt-shallow-20171101-022700-1luuy-00000.warc.gz 11367345 download   job
urls-gist.githubusercontent.com-gistfile1.txt-shallow-20171101-022700-1luuy-00000.warc.os.cdx.gz 36706 download
urls-gist.githubusercontent.com-gistfile1.txt-shallow-20171101-022700-1luuy-meta.warc.gz 27873 download   job
urls-gist.githubusercontent.com-gistfile1.txt-shallow-20171101-022700-1luuy-meta.warc.os.cdx.gz 47 download
urls-gist.githubusercontent.com-gistfile1.txt-shallow-20171101-022700-1luuy-urls.txt 20767 download
urls-gist.githubusercontent.com-gistfile1.txt-shallow-20171101-022700-1luuy.json 496 download   job
urls-gist.githubusercontent.com-noblogs-inf-20170909-231906-4g2vk-00193.warc.gz 5368744410 download   job
urls-gist.githubusercontent.com-noblogs-inf-20170909-231906-4g2vk-00193.warc.os.cdx.gz 5613230 download
web.archive.org-shallow-20171101-140941-89jct-00000.warc.gz 9630 download   job
web.archive.org-shallow-20171101-140941-89jct-00000.warc.os.cdx.gz 352 download
web.archive.org-shallow-20171101-140941-89jct-meta.warc.gz 3704 download   job
web.archive.org-shallow-20171101-140941-89jct-meta.warc.os.cdx.gz 47 download
web.archive.org-shallow-20171101-140941-89jct.json 398 download   job
www.academia.edu-shallow-20171101-143056-dh6pt-00000.warc.gz 97060189 download   job
www.academia.edu-shallow-20171101-143056-dh6pt-00000.warc.os.cdx.gz 63456 download
www.academia.edu-shallow-20171101-143056-dh6pt-meta.warc.gz 49560 download   job
www.academia.edu-shallow-20171101-143056-dh6pt-meta.warc.os.cdx.gz 47 download
www.academia.edu-shallow-20171101-143056-dh6pt.json 369 download   job
www.baseball-almanac.com-inf-20171028-032945-ee4m8-00000.warc.gz 5383768175 download   job
www.baseball-almanac.com-inf-20171028-032945-ee4m8-00000.warc.os.cdx.gz 11419207 download
www.bbc.co.uk-shallow-20171031-224045-2n4az-00000.warc.gz 4914306 download   job
www.bbc.co.uk-shallow-20171031-224045-2n4az-00000.warc.os.cdx.gz 16500 download
www.bbc.co.uk-shallow-20171031-224045-2n4az-meta.warc.gz 13085 download   job
www.bbc.co.uk-shallow-20171031-224045-2n4az-meta.warc.os.cdx.gz 47 download
www.bbc.co.uk-shallow-20171031-224045-2n4az.json 270 download   job
www.cl.cam.ac.uk-shallow-20171101-053252-60bcv-00000.warc.gz 10611876 download   job
www.cl.cam.ac.uk-shallow-20171101-053252-60bcv-00000.warc.os.cdx.gz 249 download
www.cl.cam.ac.uk-shallow-20171101-053252-60bcv-meta.warc.gz 3503 download   job
www.cl.cam.ac.uk-shallow-20171101-053252-60bcv-meta.warc.os.cdx.gz 47 download
www.cl.cam.ac.uk-shallow-20171101-053252-60bcv.json 276 download   job
www.cl.cam.ac.uk-shallow-20171101-053308-6wopf-00000.warc.gz 8363928 download   job
www.cl.cam.ac.uk-shallow-20171101-053308-6wopf-00000.warc.os.cdx.gz 244 download
www.cl.cam.ac.uk-shallow-20171101-053308-6wopf-meta.warc.gz 3519 download   job
www.cl.cam.ac.uk-shallow-20171101-053308-6wopf-meta.warc.os.cdx.gz 47 download
www.cl.cam.ac.uk-shallow-20171101-053308-6wopf.json 277 download   job
www.dslreports.com-shallow-20171031-235429-3jdfa-00000.warc.gz 421495 download   job
www.dslreports.com-shallow-20171031-235429-3jdfa-00000.warc.os.cdx.gz 3398 download
www.dslreports.com-shallow-20171031-235429-3jdfa-meta.warc.gz 5922 download   job
www.dslreports.com-shallow-20171031-235429-3jdfa-meta.warc.os.cdx.gz 47 download
www.dslreports.com-shallow-20171031-235429-3jdfa.json 326 download   job
www.foxnews.com-shallow-20171030-151146-d7apf-00000.warc.gz 78219 download   job
www.foxnews.com-shallow-20171030-151146-d7apf-00000.warc.os.cdx.gz 927 download
www.foxnews.com-shallow-20171030-151146-d7apf.json 324 download   job
www.foxnews.com-shallow-20171031-205711-awo99-00000.warc.gz 1666908089 download   job
www.foxnews.com-shallow-20171031-205711-awo99-00000.warc.os.cdx.gz 20593 download
www.foxnews.com-shallow-20171031-205711-awo99-meta.warc.gz 15923 download   job
www.foxnews.com-shallow-20171031-205711-awo99-meta.warc.os.cdx.gz 47 download
www.foxnews.com-shallow-20171031-205711-awo99.json 324 download   job
www.lifehack.org-inf-20171019-094354-4yr1a-00014.warc.gz 5391402644 download   job
www.lifehack.org-inf-20171019-094354-4yr1a-00014.warc.os.cdx.gz 2155451 download
www.lifehack.org-inf-20171019-094354-4yr1a-00015.warc.gz 5390054856 download   job
www.lifehack.org-inf-20171019-094354-4yr1a-00015.warc.os.cdx.gz 15466 download
www.lifehack.org-inf-20171019-094354-4yr1a-00016.warc.gz 5395231034 download   job
www.lifehack.org-inf-20171019-094354-4yr1a-00016.warc.os.cdx.gz 14591 download
www.lifehack.org-inf-20171019-094354-4yr1a-aborted-00017.warc.gz 1716725278 download   job
www.lifehack.org-inf-20171019-094354-4yr1a-aborted-00017.warc.os.cdx.gz 1439794 download
www.lifehack.org-inf-20171019-094354-4yr1a-aborted.json 242 download   job
www.naciodigital.cat-inf-20170919-214300-247yw-00072.warc.gz 5368717041 download   job
www.naciodigital.cat-inf-20170919-214300-247yw-00072.warc.os.cdx.gz 4498330 download
www.naciodigital.cat-inf-20170919-214300-247yw-00073.warc.gz 5368936694 download   job
www.naciodigital.cat-inf-20170919-214300-247yw-00073.warc.os.cdx.gz 5304568 download
www.reddit.com-shallow-20171031-231227-at7us-00000.warc.gz 2840852 download   job
www.reddit.com-shallow-20171031-231227-at7us-00000.warc.os.cdx.gz 10726 download
www.reddit.com-shallow-20171031-231227-at7us-meta.warc.gz 9626 download   job
www.reddit.com-shallow-20171031-231227-at7us-meta.warc.os.cdx.gz 47 download
www.reddit.com-shallow-20171031-231227-at7us.json 323 download   job
www.riuni.unisul.br-shallow-20171101-135503-bg4on-00000.warc.gz 667368 download   job
www.riuni.unisul.br-shallow-20171101-135503-bg4on-00000.warc.os.cdx.gz 297 download
www.riuni.unisul.br-shallow-20171101-135503-bg4on-meta.warc.gz 3614 download   job
www.riuni.unisul.br-shallow-20171101-135503-bg4on-meta.warc.os.cdx.gz 47 download
www.riuni.unisul.br-shallow-20171101-135503-bg4on.json 323 download   job
www.snh2013.anpuh.org-shallow-20171101-134139-eekqu-00000.warc.gz 117136 download   job
www.snh2013.anpuh.org-shallow-20171101-134139-eekqu-00000.warc.os.cdx.gz 272 download
www.snh2013.anpuh.org-shallow-20171101-134139-eekqu-meta.warc.gz 3560 download   job
www.snh2013.anpuh.org-shallow-20171101-134139-eekqu-meta.warc.os.cdx.gz 47 download
www.snh2013.anpuh.org-shallow-20171101-134139-eekqu.json 310 download   job
www.snh2017.anpuh.org-shallow-20171101-135520-bmf33-00000.warc.gz 715238 download   job
www.snh2017.anpuh.org-shallow-20171101-135520-bmf33-00000.warc.os.cdx.gz 325 download
www.snh2017.anpuh.org-shallow-20171101-135520-bmf33-meta.warc.gz 3645 download   job
www.snh2017.anpuh.org-shallow-20171101-135520-bmf33-meta.warc.os.cdx.gz 47 download
www.snh2017.anpuh.org-shallow-20171101-135520-bmf33.json 361 download   job
www.solarroadways.com-shallow-20171101-135222-yttp1-00000.warc.gz 1929877 download   job
www.solarroadways.com-shallow-20171101-135222-yttp1-00000.warc.os.cdx.gz 3645 download
www.solarroadways.com-shallow-20171101-135222-yttp1-meta.warc.gz 5652 download   job
www.solarroadways.com-shallow-20171101-135222-yttp1-meta.warc.os.cdx.gz 47 download
www.solarroadways.com-shallow-20171101-135222-yttp1.json 249 download   job
www.techdirt.com-shallow-20171101-172526-2b1zi.json 340 download   job
www.theblaze.com-shallow-20171101-035153-a7wr9-00000.warc.gz 7843791 download   job
www.theblaze.com-shallow-20171101-035153-a7wr9-00000.warc.os.cdx.gz 14220 download
www.theblaze.com-shallow-20171101-035153-a7wr9-meta.warc.gz 12259 download   job
www.theblaze.com-shallow-20171101-035153-a7wr9-meta.warc.os.cdx.gz 47 download
www.theblaze.com-shallow-20171101-035153-a7wr9.json 356 download   job
www.theguardian.com-shallow-20171101-151430-adfr1-00000.warc.gz 513191 download   job
www.theguardian.com-shallow-20171101-151430-adfr1-00000.warc.os.cdx.gz 4223 download
www.theguardian.com-shallow-20171101-151430-adfr1-meta.warc.gz 6704 download   job
www.theguardian.com-shallow-20171101-151430-adfr1-meta.warc.os.cdx.gz 47 download
www.theguardian.com-shallow-20171101-151430-adfr1.json 363 download   job
www.transparenciacatalunya.cat-inf-20171101-102233-3ml3o-00000.warc.gz 1746225435 download   job
www.transparenciacatalunya.cat-inf-20171101-102233-3ml3o-00000.warc.os.cdx.gz 2651386 download
www.transparenciacatalunya.cat-inf-20171101-102233-3ml3o-meta.warc.gz 1660134 download   job
www.transparenciacatalunya.cat-inf-20171101-102233-3ml3o-meta.warc.os.cdx.gz 47 download
www.transparenciacatalunya.cat-inf-20171101-102233-3ml3o.json 260 download   job
www.upi.com-shallow-20171031-235034-e15fv-00000.warc.gz 1569167 download   job
www.upi.com-shallow-20171031-235034-e15fv-00000.warc.os.cdx.gz 7799 download
www.upi.com-shallow-20171031-235034-e15fv-meta.warc.gz 8656 download   job
www.upi.com-shallow-20171031-235034-e15fv-meta.warc.os.cdx.gz 47 download
www.upi.com-shallow-20171031-235034-e15fv.json 362 download   job
www.wiocha.pl-inf-20171018-113215-2i2w3-00027.warc.gz 5370583467 download   job
www.wiocha.pl-inf-20171018-113215-2i2w3-00027.warc.os.cdx.gz 6727959 download
www.wiocha.pl-inf-20171018-113215-2i2w3-00028.warc.gz 5368747694 download   job
www.wiocha.pl-inf-20171018-113215-2i2w3-00028.warc.os.cdx.gz 7650383 download
www.wiocha.pl-inf-20171018-113215-2i2w3-00029.warc.gz 5368820312 download   job
www.wiocha.pl-inf-20171018-113215-2i2w3-00029.warc.os.cdx.gz 9476445 download
www1.folha.uol.com.br-shallow-20171101-125641-2zfmy-00000.warc.gz 1701762 download   job
www1.folha.uol.com.br-shallow-20171101-125641-2zfmy-00000.warc.os.cdx.gz 7638 download
www1.folha.uol.com.br-shallow-20171101-125641-2zfmy-meta.warc.gz 8741 download   job
www1.folha.uol.com.br-shallow-20171101-125641-2zfmy-meta.warc.os.cdx.gz 47 download
www1.folha.uol.com.br-shallow-20171101-125641-2zfmy.json 288 download   job
www14.gencat.cat-inf-20171101-052900-duk8w-00000.warc.gz 6625 download   job
www14.gencat.cat-inf-20171101-052900-duk8w-00000.warc.os.cdx.gz 322 download
www14.gencat.cat-inf-20171101-052900-duk8w-meta.warc.gz 3528 download   job
www14.gencat.cat-inf-20171101-052900-duk8w-meta.warc.os.cdx.gz 47 download
www14.gencat.cat-inf-20171101-052900-duk8w.json 246 download   job
www15.gencat.cat-inf-20171101-052909-e91vq-00000.warc.gz 6112 download   job
www15.gencat.cat-inf-20171101-052909-e91vq-00000.warc.os.cdx.gz 47 download
www15.gencat.cat-inf-20171101-052909-e91vq-meta.warc.gz 3653 download   job
www15.gencat.cat-inf-20171101-052909-e91vq-meta.warc.os.cdx.gz 47 download
www15.gencat.cat-inf-20171101-052909-e91vq.json 246 download   job