Item archiveteam_archivebot_go_20231002142652_43cb1d30
Filename | Size | |
---|---|---|
27.tumblr.com-inf-20230809-001840-cywaz-01929.warc.gz | 5371537015 | download job |
27.tumblr.com-inf-20230809-001840-cywaz-01929.warc.os.cdx.gz | 1400139 | download |
archiveteam_archivebot_go_20231002142652_43cb1d30.cdx.gz | 1471486 | download |
archiveteam_archivebot_go_20231002142652_43cb1d30.cdx.idx | 1275 | download |
archiveteam_archivebot_go_20231002142652_43cb1d30_files.xml | 0 | download |
archiveteam_archivebot_go_20231002142652_43cb1d30_meta.sqlite | 110592 | download |
archiveteam_archivebot_go_20231002142652_43cb1d30_meta.xml | 995 | download |
ceur-ws.org-inf-20231002-075735-awhll-00008.warc.gz | 5383950645 | download job |
ceur-ws.org-inf-20231002-075735-awhll-00008.warc.os.cdx.gz | 48163 | download |
ceur-ws.org-inf-20231002-075735-awhll-00009.warc.gz | 5387025015 | download job |
ceur-ws.org-inf-20231002-075735-awhll-00009.warc.os.cdx.gz | 56401 | download |
digitalmaine.com-inf-20230821-020801-4zf6k-01332.warc.gz | 5427244805 | download job |
digitalmaine.com-inf-20230821-020801-4zf6k-01332.warc.os.cdx.gz | 10369 | download |
digitalmaine.com-inf-20230821-020801-4zf6k-01333.warc.gz | 5433046175 | download job |
digitalmaine.com-inf-20230821-020801-4zf6k-01333.warc.os.cdx.gz | 12079 | download |
en.wikipedia.org-shallow-20231002-134242-72820-00000.warc.gz | 339921 | download job |
en.wikipedia.org-shallow-20231002-134242-72820-00000.warc.os.cdx.gz | 6048 | download |
en.wikipedia.org-shallow-20231002-134242-72820-meta.warc.gz | 6968 | download job |
en.wikipedia.org-shallow-20231002-134242-72820-meta.warc.os.cdx.gz | 47 | download |
en.wikipedia.org-shallow-20231002-134242-72820.json | 270 | download job |
en.wikipedia.org-shallow-20231002-134247-1tz1p-00000.warc.gz | 340344 | download job |
en.wikipedia.org-shallow-20231002-134247-1tz1p-00000.warc.os.cdx.gz | 6127 | download |
en.wikipedia.org-shallow-20231002-134247-1tz1p-meta.warc.gz | 7123 | download job |
en.wikipedia.org-shallow-20231002-134247-1tz1p-meta.warc.os.cdx.gz | 47 | download |
en.wikipedia.org-shallow-20231002-134247-1tz1p.json | 298 | download job |
factcheck.kg-inf-20230822-222114-1rs6h-00008.warc.gz | 5567873815 | download job |
factcheck.kg-inf-20230822-222114-1rs6h-00008.warc.os.cdx.gz | 2945056 | download |
forum.hrwiki.org-inf-20230917-095343-11syn-00018.warc.gz | 5377042831 | download job |
forum.hrwiki.org-inf-20230917-095343-11syn-00018.warc.os.cdx.gz | 2722511 | download |
git.icecoredata.org-inf-20230930-151706-esz1i-00097.warc.gz | 8886701933 | download job |
git.icecoredata.org-inf-20230930-151706-esz1i-00097.warc.os.cdx.gz | 44954 | download |
git.icecoredata.org-inf-20230930-151706-esz1i-00098.warc.gz | 8119366239 | download job |
git.icecoredata.org-inf-20230930-151706-esz1i-00098.warc.os.cdx.gz | 612 | download |
git.icecoredata.org-inf-20230930-151706-esz1i-00099.warc.gz | 8141701057 | download job |
git.icecoredata.org-inf-20230930-151706-esz1i-00099.warc.os.cdx.gz | 1285 | download |
lesobservateurs.ch-inf-20230917-113444-1v9zj-00200.warc.gz | 5374182762 | download job |
lesobservateurs.ch-inf-20230917-113444-1v9zj-00200.warc.os.cdx.gz | 1924880 | download |
unicode.scarfboy.com-inf-20230930-221059-28ocb-00000.warc.gz | 5368709292 | download job |
unicode.scarfboy.com-inf-20230930-221059-28ocb-00000.warc.os.cdx.gz | 32074273 | download |
unity.com-inf-20230914-160454-uskmn-01444.warc.gz | 6732663547 | download job |
unity.com-inf-20230914-160454-uskmn-01444.warc.os.cdx.gz | 3200 | download |
unity.com-inf-20230914-160454-uskmn-01445.warc.gz | 5377694057 | download job |
unity.com-inf-20230914-160454-uskmn-01445.warc.os.cdx.gz | 11352 | download |
valoriez.blogspot.com-inf-20231002-080848-12bsc-00001.warc.gz | 5489088650 | download job |
valoriez.blogspot.com-inf-20231002-080848-12bsc-00001.warc.os.cdx.gz | 3280342 | download |
videos.sapo.pt-inf-20230910-063253-3tg7d-00512.warc.gz | 5376752896 | download job |
videos.sapo.pt-inf-20230910-063253-3tg7d-00512.warc.os.cdx.gz | 165168 | download |
videos.sapo.pt-inf-20230910-063253-3tg7d-00513.warc.gz | 5404150081 | download job |
videos.sapo.pt-inf-20230910-063253-3tg7d-00513.warc.os.cdx.gz | 107590 | download |
www.buzzfeednews.com-inf-20230420-160602-d4rha-01851.warc.gz | 5472946963 | download job |
www.buzzfeednews.com-inf-20230420-160602-d4rha-01851.warc.os.cdx.gz | 1033250 | download |
www.harvard.com-shallow-20231002-135159-2ybdg-00000.warc.gz | 1595208 | download job |
www.harvard.com-shallow-20231002-135159-2ybdg-00000.warc.os.cdx.gz | 10253 | download |
www.harvard.com-shallow-20231002-135159-2ybdg-meta.warc.gz | 9508 | download job |
www.harvard.com-shallow-20231002-135159-2ybdg-meta.warc.os.cdx.gz | 47 | download |
www.harvard.com-shallow-20231002-135159-2ybdg.json | 279 | download job |
www.newyorker.com-shallow-20231002-134905-ell7p-00000.warc.gz | 18792947 | download job |
www.newyorker.com-shallow-20231002-134905-ell7p-00000.warc.os.cdx.gz | 27242 | download |
www.newyorker.com-shallow-20231002-134905-ell7p-meta.warc.gz | 20683 | download job |
www.newyorker.com-shallow-20231002-134905-ell7p-meta.warc.os.cdx.gz | 47 | download |
www.newyorker.com-shallow-20231002-134905-ell7p-wpull.log.gz | 17919 | download |
www.newyorker.com-shallow-20231002-134905-ell7p.json | 367 | download job |
www.nybooks.com-shallow-20231002-134724-77csm-00000.warc.gz | 126253768 | download job |
www.nybooks.com-shallow-20231002-134724-77csm-00000.warc.os.cdx.gz | 15087 | download |
www.nybooks.com-shallow-20231002-134724-77csm-meta.warc.gz | 14517 | download job |
www.nybooks.com-shallow-20231002-134724-77csm-meta.warc.os.cdx.gz | 47 | download |
www.nybooks.com-shallow-20231002-134724-77csm.json | 319 | download job |
www.nypl.org-shallow-20231002-134303-58xfa-00000.warc.gz | 444593852 | download job |
www.nypl.org-shallow-20231002-134303-58xfa-00000.warc.os.cdx.gz | 14367 | download |
www.nypl.org-shallow-20231002-134303-58xfa-meta.warc.gz | 12598 | download job |
www.nypl.org-shallow-20231002-134303-58xfa-meta.warc.os.cdx.gz | 47 | download |
www.nypl.org-shallow-20231002-134303-58xfa.json | 269 | download job |
www.nypl.org-shallow-20231002-134447-7kk0m-00000.warc.gz | 5463965 | download job |
www.nypl.org-shallow-20231002-134447-7kk0m-00000.warc.os.cdx.gz | 6522 | download |
www.nypl.org-shallow-20231002-134447-7kk0m-meta.warc.gz | 7684 | download job |
www.nypl.org-shallow-20231002-134447-7kk0m-meta.warc.os.cdx.gz | 47 | download |
www.nypl.org-shallow-20231002-134447-7kk0m.json | 297 | download job |
www.rtve.es-inf-20230807-032318-698gj-00740.warc.gz | 5368719949 | download job |
www.rtve.es-inf-20230807-032318-698gj-00740.warc.os.cdx.gz | 5971639 | download |
www.zeutschel.de-shallow-20231002-134527-dyg3g-00000.warc.gz | 2167295 | download job |
www.zeutschel.de-shallow-20231002-134527-dyg3g-00000.warc.os.cdx.gz | 2554 | download |
www.zeutschel.de-shallow-20231002-134527-dyg3g-meta.warc.gz | 5037 | download job |
www.zeutschel.de-shallow-20231002-134527-dyg3g-meta.warc.os.cdx.gz | 47 | download |
www.zeutschel.de-shallow-20231002-134527-dyg3g.json | 307 | download job |