Item archiveteam_archivebot_go_20200712150003
Filename | Size | |
---|---|---|
archiveteam_archivebot_go_20200712150003.cdx.gz | 119151924 | download |
archiveteam_archivebot_go_20200712150003.cdx.idx | 99281 | download |
archiveteam_archivebot_go_20200712150003_files.xml | 0 | download |
archiveteam_archivebot_go_20200712150003_meta.sqlite | 649216 | download |
archiveteam_archivebot_go_20200712150003_meta.xml | 969 | download |
getsatisfaction.com-inf-20200708-234031-epnla-00016.warc.gz | 5376082429 | download job |
getsatisfaction.com-inf-20200708-234031-epnla-00016.warc.os.cdx.gz | 7726503 | download |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00131.warc.gz | 5369173598 | download job |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00131.warc.os.cdx.gz | 113861 | download |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00132.warc.gz | 5369863897 | download job |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00132.warc.os.cdx.gz | 160724 | download |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00133.warc.gz | 5370926302 | download job |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00133.warc.os.cdx.gz | 293829 | download |
ninjamountain.blogspot.com-inf-20200712-073150-8n97d-00002.warc.gz | 3834628441 | download job |
ninjamountain.blogspot.com-inf-20200712-073150-8n97d-00002.warc.os.cdx.gz | 3369170 | download |
ninjamountain.blogspot.com-inf-20200712-073150-8n97d-meta.warc.gz | 2701883 | download job |
ninjamountain.blogspot.com-inf-20200712-073150-8n97d-meta.warc.os.cdx.gz | 47 | download |
nu-kak-tam-s-dengami.sk8er.name-shallow-20200712-133909-c4qmt-00000.warc.gz | 1877817 | download job |
nu-kak-tam-s-dengami.sk8er.name-shallow-20200712-133909-c4qmt-00000.warc.os.cdx.gz | 6278 | download |
nu-kak-tam-s-dengami.sk8er.name-shallow-20200712-133909-c4qmt-meta.warc.gz | 7134 | download job |
nu-kak-tam-s-dengami.sk8er.name-shallow-20200712-133909-c4qmt-meta.warc.os.cdx.gz | 47 | download |
nu-kak-tam-s-dengami.sk8er.name-shallow-20200712-133909-c4qmt.json | 266 | download job |
old.reddit.com-inf-20200712-011858-coxzo-00006.warc.gz | 5369016906 | download job |
old.reddit.com-inf-20200712-011858-coxzo-00006.warc.os.cdx.gz | 2391316 | download |
old.reddit.com-inf-20200712-011858-coxzo-00007.warc.gz | 5556933264 | download job |
old.reddit.com-inf-20200712-011858-coxzo-00007.warc.os.cdx.gz | 1167800 | download |
urls-archive.max.fan-twitter-@FLSecofState-filtered.txt-shallow-20200712-143843-6en3a-00000.warc.gz | 191953715 | download job |
urls-archive.max.fan-twitter-@FLSecofState-filtered.txt-shallow-20200712-143843-6en3a-00000.warc.os.cdx.gz | 186496 | download |
urls-archive.max.fan-twitter-@FLSecofState-filtered.txt-shallow-20200712-143843-6en3a-meta.warc.gz | 102367 | download job |
urls-archive.max.fan-twitter-@FLSecofState-filtered.txt-shallow-20200712-143843-6en3a-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FLSecofState-filtered.txt-shallow-20200712-143843-6en3a-urls.txt | 50640 | download |
urls-archive.max.fan-twitter-@FNyusi-filtered.txt-shallow-20200712-143316-ce2zj-00000.warc.gz | 44068200 | download job |
urls-archive.max.fan-twitter-@FNyusi-filtered.txt-shallow-20200712-143316-ce2zj-00000.warc.os.cdx.gz | 96412 | download |
urls-archive.max.fan-twitter-@FNyusi-filtered.txt-shallow-20200712-143316-ce2zj-meta.warc.gz | 55716 | download job |
urls-archive.max.fan-twitter-@FNyusi-filtered.txt-shallow-20200712-143316-ce2zj-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FNyusi-filtered.txt-shallow-20200712-143316-ce2zj-urls.txt | 29059 | download |
urls-archive.max.fan-twitter-@FNyusi-filtered.txt-shallow-20200712-143316-ce2zj.json | 327 | download job |
urls-archive.max.fan-twitter-@FluNearYou-filtered.txt-shallow-20200712-143319-64zpr-00000.warc.gz | 122897339 | download job |
urls-archive.max.fan-twitter-@FluNearYou-filtered.txt-shallow-20200712-143319-64zpr-00000.warc.os.cdx.gz | 148879 | download |
urls-archive.max.fan-twitter-@FluNearYou-filtered.txt-shallow-20200712-143319-64zpr-urls.txt | 79429 | download |
urls-archive.max.fan-twitter-@FluNearYou-filtered.txt-shallow-20200712-143319-64zpr.json | 335 | download job |
urls-archive.max.fan-twitter-@Folkhalsomynd-filtered.txt-shallow-20200712-142619-e3an9-00000.warc.gz | 172893471 | download job |
urls-archive.max.fan-twitter-@Folkhalsomynd-filtered.txt-shallow-20200712-142619-e3an9-00000.warc.os.cdx.gz | 371941 | download |
urls-archive.max.fan-twitter-@Folkhalsomynd-filtered.txt-shallow-20200712-142619-e3an9-meta.warc.gz | 204397 | download job |
urls-archive.max.fan-twitter-@Folkhalsomynd-filtered.txt-shallow-20200712-142619-e3an9-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Folkhalsomynd-filtered.txt-shallow-20200712-142619-e3an9-urls.txt | 122100 | download |
urls-archive.max.fan-twitter-@Folkhalsomynd-filtered.txt-shallow-20200712-142619-e3an9.json | 341 | download job |
urls-archive.max.fan-twitter-@FonsecaAP-filtered.txt-shallow-20200712-142619-8evkl-00000.warc.gz | 76140072 | download job |
urls-archive.max.fan-twitter-@FonsecaAP-filtered.txt-shallow-20200712-142619-8evkl-00000.warc.os.cdx.gz | 118969 | download |
urls-archive.max.fan-twitter-@FonsecaAP-filtered.txt-shallow-20200712-142619-8evkl-meta.warc.gz | 68489 | download job |
urls-archive.max.fan-twitter-@FonsecaAP-filtered.txt-shallow-20200712-142619-8evkl-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FonsecaAP-filtered.txt-shallow-20200712-142619-8evkl.json | 333 | download job |
urls-archive.max.fan-twitter-@ForIdahoRefugee-filtered.txt-shallow-20200712-142529-70icl-00000.warc.gz | 3792030 | download job |
urls-archive.max.fan-twitter-@ForIdahoRefugee-filtered.txt-shallow-20200712-142529-70icl-00000.warc.os.cdx.gz | 6632 | download |
urls-archive.max.fan-twitter-@ForIdahoRefugee-filtered.txt-shallow-20200712-142529-70icl-meta.warc.gz | 7688 | download job |
urls-archive.max.fan-twitter-@ForIdahoRefugee-filtered.txt-shallow-20200712-142529-70icl-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@ForIdahoRefugee-filtered.txt-shallow-20200712-142529-70icl-urls.txt | 2666 | download |
urls-archive.max.fan-twitter-@FortLarnedNPS-filtered.txt-shallow-20200712-142528-b8fin-00000.warc.gz | 27484708 | download job |
urls-archive.max.fan-twitter-@FortLarnedNPS-filtered.txt-shallow-20200712-142528-b8fin-00000.warc.os.cdx.gz | 29266 | download |
urls-archive.max.fan-twitter-@FortLarnedNPS-filtered.txt-shallow-20200712-142528-b8fin-meta.warc.gz | 19981 | download job |
urls-archive.max.fan-twitter-@FortLarnedNPS-filtered.txt-shallow-20200712-142528-b8fin-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FortLarnedNPS-filtered.txt-shallow-20200712-142528-b8fin-urls.txt | 7283 | download |
urls-archive.max.fan-twitter-@FortLarnedNPS-filtered.txt-shallow-20200712-142528-b8fin.json | 341 | download job |
urls-archive.max.fan-twitter-@FrancoiseNyssen-filtered.txt-shallow-20200712-141757-e7ns7-00000.warc.gz | 288865354 | download job |
urls-archive.max.fan-twitter-@FrancoiseNyssen-filtered.txt-shallow-20200712-141757-e7ns7-00000.warc.os.cdx.gz | 666812 | download |
urls-archive.max.fan-twitter-@FrancoiseNyssen-filtered.txt-shallow-20200712-141757-e7ns7-meta.warc.gz | 359020 | download job |
urls-archive.max.fan-twitter-@FrancoiseNyssen-filtered.txt-shallow-20200712-141757-e7ns7-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FrancoiseNyssen-filtered.txt-shallow-20200712-141757-e7ns7-urls.txt | 78400 | download |
urls-archive.max.fan-twitter-@FrancoiseNyssen-filtered.txt-shallow-20200712-141757-e7ns7.json | 345 | download job |
urls-archive.max.fan-twitter-@FredMonyak-filtered.txt-shallow-20200712-141624-ddstr-meta.warc.gz | 106354 | download job |
urls-archive.max.fan-twitter-@FredMonyak-filtered.txt-shallow-20200712-141624-ddstr-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FredMonyak-filtered.txt-shallow-20200712-141624-ddstr-urls.txt | 55608 | download |
urls-archive.max.fan-twitter-@FredMonyak-filtered.txt-shallow-20200712-141624-ddstr.json | 335 | download job |
urls-archive.max.fan-twitter-@French_Gov-filtered.txt-shallow-20200712-141449-9asbx-00000.warc.gz | 168608472 | download job |
urls-archive.max.fan-twitter-@French_Gov-filtered.txt-shallow-20200712-141449-9asbx-00000.warc.os.cdx.gz | 393858 | download |
urls-archive.max.fan-twitter-@French_Gov-filtered.txt-shallow-20200712-141449-9asbx-meta.warc.gz | 213579 | download job |
urls-archive.max.fan-twitter-@French_Gov-filtered.txt-shallow-20200712-141449-9asbx-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@French_Gov-filtered.txt-shallow-20200712-141449-9asbx-urls.txt | 47550 | download |
urls-archive.max.fan-twitter-@French_Gov-filtered.txt-shallow-20200712-141449-9asbx.json | 335 | download job |
urls-archive.max.fan-twitter-@FundacionONU-filtered.txt-shallow-20200712-141242-6cv45-00000.warc.gz | 474898633 | download job |
urls-archive.max.fan-twitter-@FundacionONU-filtered.txt-shallow-20200712-141242-6cv45-00000.warc.os.cdx.gz | 610184 | download |
urls-archive.max.fan-twitter-@FundacionONU-filtered.txt-shallow-20200712-141242-6cv45-urls.txt | 333173 | download |
urls-archive.max.fan-twitter-@FundacionONU-filtered.txt-shallow-20200712-141242-6cv45.json | 339 | download job |
urls-archive.max.fan-twitter-@GEFI_Youth-filtered.txt-shallow-20200712-140358-9a17j-00000.warc.gz | 109238719 | download job |
urls-archive.max.fan-twitter-@GEFI_Youth-filtered.txt-shallow-20200712-140358-9a17j-00000.warc.os.cdx.gz | 178079 | download |
urls-archive.max.fan-twitter-@GEFI_Youth-filtered.txt-shallow-20200712-140358-9a17j-meta.warc.gz | 99228 | download job |
urls-archive.max.fan-twitter-@GEFI_Youth-filtered.txt-shallow-20200712-140358-9a17j-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GEFI_Youth-filtered.txt-shallow-20200712-140358-9a17j-urls.txt | 77980 | download |
urls-archive.max.fan-twitter-@GEFI_Youth-filtered.txt-shallow-20200712-140358-9a17j.json | 335 | download job |
urls-archive.max.fan-twitter-@GHoungbo-filtered.txt-shallow-20200712-134957-1pxn7-00000.warc.gz | 90515225 | download job |
urls-archive.max.fan-twitter-@GHoungbo-filtered.txt-shallow-20200712-134957-1pxn7-00000.warc.os.cdx.gz | 173912 | download |
urls-archive.max.fan-twitter-@GHoungbo-filtered.txt-shallow-20200712-134957-1pxn7-meta.warc.gz | 97165 | download job |
urls-archive.max.fan-twitter-@GHoungbo-filtered.txt-shallow-20200712-134957-1pxn7-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GHoungbo-filtered.txt-shallow-20200712-134957-1pxn7-urls.txt | 24091 | download |
urls-archive.max.fan-twitter-@GHoungbo-filtered.txt-shallow-20200712-134957-1pxn7.json | 331 | download job |
urls-archive.max.fan-twitter-@GJvanBohemen-filtered.txt-shallow-20200712-133426-86ad6-00000.warc.gz | 6968088 | download job |
urls-archive.max.fan-twitter-@GJvanBohemen-filtered.txt-shallow-20200712-133426-86ad6-00000.warc.os.cdx.gz | 19079 | download |
urls-archive.max.fan-twitter-@GJvanBohemen-filtered.txt-shallow-20200712-133426-86ad6-meta.warc.gz | 14548 | download job |
urls-archive.max.fan-twitter-@GJvanBohemen-filtered.txt-shallow-20200712-133426-86ad6-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GJvanBohemen-filtered.txt-shallow-20200712-133426-86ad6-urls.txt | 3128 | download |
urls-archive.max.fan-twitter-@GJvanBohemen-filtered.txt-shallow-20200712-133426-86ad6.json | 339 | download job |
urls-archive.max.fan-twitter-@GOP_PR51-filtered.txt-shallow-20200712-132347-ahpwc-00000.warc.gz | 189852402 | download job |
urls-archive.max.fan-twitter-@GOP_PR51-filtered.txt-shallow-20200712-132347-ahpwc-00000.warc.os.cdx.gz | 218035 | download |
urls-archive.max.fan-twitter-@GOP_PR51-filtered.txt-shallow-20200712-132347-ahpwc-meta.warc.gz | 120525 | download job |
urls-archive.max.fan-twitter-@GOP_PR51-filtered.txt-shallow-20200712-132347-ahpwc-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GOP_PR51-filtered.txt-shallow-20200712-132347-ahpwc-urls.txt | 59225 | download |
urls-archive.max.fan-twitter-@GOP_PR51-filtered.txt-shallow-20200712-132347-ahpwc.json | 331 | download job |
urls-archive.max.fan-twitter-@GOV_BN-filtered.txt-shallow-20200712-131222-1czi7-00000.warc.gz | 152202137 | download job |
urls-archive.max.fan-twitter-@GOV_BN-filtered.txt-shallow-20200712-131222-1czi7-00000.warc.os.cdx.gz | 152555 | download |
urls-archive.max.fan-twitter-@GOV_BN-filtered.txt-shallow-20200712-131222-1czi7-meta.warc.gz | 84341 | download job |
urls-archive.max.fan-twitter-@GOV_BN-filtered.txt-shallow-20200712-131222-1czi7-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GOV_BN-filtered.txt-shallow-20200712-131222-1czi7-urls.txt | 132678 | download |
urls-archive.max.fan-twitter-@GOV_BN-filtered.txt-shallow-20200712-131222-1czi7.json | 327 | download job |
urls-archive.max.fan-twitter-@GardinerHarris-filtered.txt-shallow-20200712-140425-5hlqj-00000.warc.gz | 120537502 | download job |
urls-archive.max.fan-twitter-@GardinerHarris-filtered.txt-shallow-20200712-140425-5hlqj-00000.warc.os.cdx.gz | 282134 | download |
urls-archive.max.fan-twitter-@GardinerHarris-filtered.txt-shallow-20200712-140425-5hlqj-meta.warc.gz | 154521 | download job |
urls-archive.max.fan-twitter-@GardinerHarris-filtered.txt-shallow-20200712-140425-5hlqj-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GardinerHarris-filtered.txt-shallow-20200712-140425-5hlqj-urls.txt | 88884 | download |
urls-archive.max.fan-twitter-@GardinerHarris-filtered.txt-shallow-20200712-140425-5hlqj.json | 343 | download job |
urls-archive.max.fan-twitter-@Ghanaunmission-filtered.txt-shallow-20200712-135000-13rzx-00000.warc.gz | 47117503 | download job |
urls-archive.max.fan-twitter-@Ghanaunmission-filtered.txt-shallow-20200712-135000-13rzx-00000.warc.os.cdx.gz | 52601 | download |
urls-archive.max.fan-twitter-@Ghanaunmission-filtered.txt-shallow-20200712-135000-13rzx-meta.warc.gz | 32161 | download job |
urls-archive.max.fan-twitter-@Ghanaunmission-filtered.txt-shallow-20200712-135000-13rzx-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Ghanaunmission-filtered.txt-shallow-20200712-135000-13rzx-urls.txt | 8990 | download |
urls-archive.max.fan-twitter-@Ghanaunmission-filtered.txt-shallow-20200712-135000-13rzx.json | 343 | download job |
urls-archive.max.fan-twitter-@GillFurnissMP-filtered.txt-shallow-20200712-134848-5vixj-00000.warc.gz | 281208387 | download job |
urls-archive.max.fan-twitter-@GillFurnissMP-filtered.txt-shallow-20200712-134848-5vixj-00000.warc.os.cdx.gz | 474896 | download |
urls-archive.max.fan-twitter-@GillFurnissMP-filtered.txt-shallow-20200712-134848-5vixj-meta.warc.gz | 255786 | download job |
urls-archive.max.fan-twitter-@GillFurnissMP-filtered.txt-shallow-20200712-134848-5vixj-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GillFurnissMP-filtered.txt-shallow-20200712-134848-5vixj-urls.txt | 124499 | download |
urls-archive.max.fan-twitter-@GillFurnissMP-filtered.txt-shallow-20200712-134848-5vixj.json | 341 | download job |
urls-archive.max.fan-twitter-@GinettePT-filtered.txt-shallow-20200712-133758-7p8iu-00000.warc.gz | 678511741 | download job |
urls-archive.max.fan-twitter-@GinettePT-filtered.txt-shallow-20200712-133758-7p8iu-00000.warc.os.cdx.gz | 846625 | download |
urls-archive.max.fan-twitter-@GinettePT-filtered.txt-shallow-20200712-133758-7p8iu-meta.warc.gz | 459976 | download job |
urls-archive.max.fan-twitter-@GinettePT-filtered.txt-shallow-20200712-133758-7p8iu-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GinettePT-filtered.txt-shallow-20200712-133758-7p8iu-urls.txt | 177354 | download |
urls-archive.max.fan-twitter-@GinettePT-filtered.txt-shallow-20200712-133758-7p8iu.json | 333 | download job |
urls-archive.max.fan-twitter-@GioRussonello-filtered.txt-shallow-20200712-133757-9j86j-00000.warc.gz | 103212063 | download job |
urls-archive.max.fan-twitter-@GioRussonello-filtered.txt-shallow-20200712-133757-9j86j-00000.warc.os.cdx.gz | 185110 | download |
urls-archive.max.fan-twitter-@GioRussonello-filtered.txt-shallow-20200712-133757-9j86j-meta.warc.gz | 103959 | download job |
urls-archive.max.fan-twitter-@GioRussonello-filtered.txt-shallow-20200712-133757-9j86j-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GioRussonello-filtered.txt-shallow-20200712-133757-9j86j-urls.txt | 64060 | download |
urls-archive.max.fan-twitter-@GioRussonello-filtered.txt-shallow-20200712-133757-9j86j.json | 341 | download job |
urls-archive.max.fan-twitter-@GlennCountyOES-filtered.txt-shallow-20200712-133423-9hk7i-00000.warc.gz | 239878104 | download job |
urls-archive.max.fan-twitter-@GlennCountyOES-filtered.txt-shallow-20200712-133423-9hk7i-00000.warc.os.cdx.gz | 191136 | download |
urls-archive.max.fan-twitter-@GlennCountyOES-filtered.txt-shallow-20200712-133423-9hk7i-meta.warc.gz | 104841 | download job |
urls-archive.max.fan-twitter-@GlennCountyOES-filtered.txt-shallow-20200712-133423-9hk7i-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GlennCountyOES-filtered.txt-shallow-20200712-133423-9hk7i-urls.txt | 74540 | download |
urls-archive.max.fan-twitter-@GlennCountyOES-filtered.txt-shallow-20200712-133423-9hk7i.json | 343 | download job |
urls-archive.max.fan-twitter-@GlobalEduFirst-filtered.txt-shallow-20200712-133420-au5ho-meta.warc.gz | 365977 | download job |
urls-archive.max.fan-twitter-@GlobalEduFirst-filtered.txt-shallow-20200712-133420-au5ho-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GlobalEduFirst-filtered.txt-shallow-20200712-133420-au5ho-urls.txt | 241377 | download |
urls-archive.max.fan-twitter-@GlobalEduFirst-filtered.txt-shallow-20200712-133420-au5ho.json | 343 | download job |
urls-archive.max.fan-twitter-@GoVerbWorld-filtered.txt-shallow-20200712-130350-ewbp6-00000.warc.gz | 154096076 | download job |
urls-archive.max.fan-twitter-@GoVerbWorld-filtered.txt-shallow-20200712-130350-ewbp6-00000.warc.os.cdx.gz | 209191 | download |
urls-archive.max.fan-twitter-@GoVerbWorld-filtered.txt-shallow-20200712-130350-ewbp6-meta.warc.gz | 115284 | download job |
urls-archive.max.fan-twitter-@GoVerbWorld-filtered.txt-shallow-20200712-130350-ewbp6-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GoVerbWorld-filtered.txt-shallow-20200712-130350-ewbp6-urls.txt | 94001 | download |
urls-archive.max.fan-twitter-@GoVerbWorld-filtered.txt-shallow-20200712-130350-ewbp6.json | 337 | download job |
urls-archive.max.fan-twitter-@GovAndyBeshear-filtered.txt-shallow-20200712-132215-38bbr-00000.warc.gz | 32227056 | download job |
urls-archive.max.fan-twitter-@GovAndyBeshear-filtered.txt-shallow-20200712-132215-38bbr-00000.warc.os.cdx.gz | 120564 | download |
urls-archive.max.fan-twitter-@GovAndyBeshear-filtered.txt-shallow-20200712-132215-38bbr-meta.warc.gz | 68524 | download job |
urls-archive.max.fan-twitter-@GovAndyBeshear-filtered.txt-shallow-20200712-132215-38bbr-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovAndyBeshear-filtered.txt-shallow-20200712-132215-38bbr-urls.txt | 7812 | download |
urls-archive.max.fan-twitter-@GovAndyBeshear-filtered.txt-shallow-20200712-132215-38bbr.json | 343 | download job |
urls-archive.max.fan-twitter-@GovBillLee-filtered.txt-shallow-20200712-132214-91vxp-00000.warc.gz | 288470123 | download job |
urls-archive.max.fan-twitter-@GovBillLee-filtered.txt-shallow-20200712-132214-91vxp-00000.warc.os.cdx.gz | 649982 | download |
urls-archive.max.fan-twitter-@GovBillLee-filtered.txt-shallow-20200712-132214-91vxp-meta.warc.gz | 350383 | download job |
urls-archive.max.fan-twitter-@GovBillLee-filtered.txt-shallow-20200712-132214-91vxp-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovBillLee-filtered.txt-shallow-20200712-132214-91vxp-urls.txt | 61364 | download |
urls-archive.max.fan-twitter-@GovBillLee-filtered.txt-shallow-20200712-132214-91vxp.json | 335 | download job |
urls-archive.max.fan-twitter-@GovChrisSununu-filtered.txt-shallow-20200712-131219-b7exz-00000.warc.gz | 946371574 | download job |
urls-archive.max.fan-twitter-@GovChrisSununu-filtered.txt-shallow-20200712-131219-b7exz-00000.warc.os.cdx.gz | 1147801 | download |
urls-archive.max.fan-twitter-@GovChrisSununu-filtered.txt-shallow-20200712-131219-b7exz-meta.warc.gz | 615462 | download job |
urls-archive.max.fan-twitter-@GovChrisSununu-filtered.txt-shallow-20200712-131219-b7exz-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovChrisSununu-filtered.txt-shallow-20200712-131219-b7exz.json | 343 | download job |
urls-archive.max.fan-twitter-@GovDunleavy-filtered.txt-shallow-20200712-131217-j15m1-00000.warc.gz | 116022746 | download job |
urls-archive.max.fan-twitter-@GovDunleavy-filtered.txt-shallow-20200712-131217-j15m1-00000.warc.os.cdx.gz | 228828 | download |
urls-archive.max.fan-twitter-@GovDunleavy-filtered.txt-shallow-20200712-131217-j15m1-meta.warc.gz | 126578 | download job |
urls-archive.max.fan-twitter-@GovDunleavy-filtered.txt-shallow-20200712-131217-j15m1-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovDunleavy-filtered.txt-shallow-20200712-131217-j15m1-urls.txt | 37878 | download |
urls-archive.max.fan-twitter-@GovDunleavy-filtered.txt-shallow-20200712-131217-j15m1.json | 337 | download job |
urls-archive.max.fan-twitter-@GovHolcomb-filtered.txt-shallow-20200712-130011-auxts-00000.warc.gz | 1173885537 | download job |
urls-archive.max.fan-twitter-@GovHolcomb-filtered.txt-shallow-20200712-130011-auxts-00000.warc.os.cdx.gz | 1561231 | download |
urls-archive.max.fan-twitter-@GovHolcomb-filtered.txt-shallow-20200712-130011-auxts-meta.warc.gz | 829198 | download job |
urls-archive.max.fan-twitter-@GovHolcomb-filtered.txt-shallow-20200712-130011-auxts-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovHolcomb-filtered.txt-shallow-20200712-130011-auxts-urls.txt | 277558 | download |
urls-archive.max.fan-twitter-@GovHolcomb-filtered.txt-shallow-20200712-130011-auxts.json | 335 | download job |
urls-archive.max.fan-twitter-@GovInslee-filtered.txt-shallow-20200712-130011-5pfsz-00000.warc.gz | 1100105998 | download job |
urls-archive.max.fan-twitter-@GovInslee-filtered.txt-shallow-20200712-130011-5pfsz-00000.warc.os.cdx.gz | 2785521 | download |
urls-archive.max.fan-twitter-@GovInslee-filtered.txt-shallow-20200712-130011-5pfsz-meta.warc.gz | 1491599 | download job |
urls-archive.max.fan-twitter-@GovInslee-filtered.txt-shallow-20200712-130011-5pfsz-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovInslee-filtered.txt-shallow-20200712-130011-5pfsz-urls.txt | 362898 | download |
urls-archive.max.fan-twitter-@GovInslee-filtered.txt-shallow-20200712-130011-5pfsz.json | 333 | download job |
urls-archive.max.fan-twitter-@GovJanetMills-filtered.txt-shallow-20200712-124425-42g5s-meta.warc.gz | 127105 | download job |
urls-archive.max.fan-twitter-@GovJanetMills-filtered.txt-shallow-20200712-124425-42g5s-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovJanetMills-filtered.txt-shallow-20200712-124425-42g5s-urls.txt | 24766 | download |
urls-archive.max.fan-twitter-@GovKemp-filtered.txt-shallow-20200712-124425-65gsp-00000.warc.gz | 363216511 | download job |
urls-archive.max.fan-twitter-@GovKemp-filtered.txt-shallow-20200712-124425-65gsp-00000.warc.os.cdx.gz | 776943 | download |
urls-archive.max.fan-twitter-@GovKemp-filtered.txt-shallow-20200712-124425-65gsp-meta.warc.gz | 417751 | download job |
urls-archive.max.fan-twitter-@GovKemp-filtered.txt-shallow-20200712-124425-65gsp-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovKemp-filtered.txt-shallow-20200712-124425-65gsp-urls.txt | 79915 | download |
urls-archive.max.fan-twitter-@GovKemp-filtered.txt-shallow-20200712-124425-65gsp.json | 329 | download job |
urls-archive.max.fan-twitter-@GovLarryHogan-filtered.txt-shallow-20200712-124423-oucxu-00000.warc.gz | 1054855173 | download job |
urls-archive.max.fan-twitter-@GovLarryHogan-filtered.txt-shallow-20200712-124423-oucxu-00000.warc.os.cdx.gz | 2069133 | download |
urls-archive.max.fan-twitter-@GovLarryHogan-filtered.txt-shallow-20200712-124423-oucxu-meta.warc.gz | 1111564 | download job |
urls-archive.max.fan-twitter-@GovLarryHogan-filtered.txt-shallow-20200712-124423-oucxu-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovLarryHogan-filtered.txt-shallow-20200712-124423-oucxu-urls.txt | 295989 | download |
urls-archive.max.fan-twitter-@GovLarryHogan-filtered.txt-shallow-20200712-124423-oucxu.json | 341 | download job |
urls-archive.max.fan-twitter-@GovLauraKelly-filtered.txt-shallow-20200712-124422-94xta-00000.warc.gz | 216748570 | download job |
urls-archive.max.fan-twitter-@GovLauraKelly-filtered.txt-shallow-20200712-124422-94xta-00000.warc.os.cdx.gz | 505025 | download |
urls-archive.max.fan-twitter-@GovLauraKelly-filtered.txt-shallow-20200712-124422-94xta-meta.warc.gz | 273653 | download job |
urls-archive.max.fan-twitter-@GovLauraKelly-filtered.txt-shallow-20200712-124422-94xta-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovLauraKelly-filtered.txt-shallow-20200712-124422-94xta-urls.txt | 59292 | download |
urls-archive.max.fan-twitter-@GovLauraKelly-filtered.txt-shallow-20200712-124422-94xta.json | 341 | download job |
urls-archive.max.fan-twitter-@GovMLG-filtered.txt-shallow-20200712-123448-bo5ly-00000.warc.gz | 421235790 | download job |
urls-archive.max.fan-twitter-@GovMLG-filtered.txt-shallow-20200712-123448-bo5ly-00000.warc.os.cdx.gz | 874679 | download |
urls-archive.max.fan-twitter-@GovMLG-filtered.txt-shallow-20200712-123448-bo5ly-meta.warc.gz | 472810 | download job |
urls-archive.max.fan-twitter-@GovMLG-filtered.txt-shallow-20200712-123448-bo5ly-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovMLG-filtered.txt-shallow-20200712-123448-bo5ly-urls.txt | 115560 | download |
urls-archive.max.fan-twitter-@GovMLG-filtered.txt-shallow-20200712-123448-bo5ly.json | 327 | download job |
urls-archive.max.fan-twitter-@GovMattBevin-filtered.txt-shallow-20200712-124421-buhrg-meta.warc.gz | 1246810 | download job |
urls-archive.max.fan-twitter-@GovMattBevin-filtered.txt-shallow-20200712-124421-buhrg-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovMattBevin-filtered.txt-shallow-20200712-124421-buhrg-urls.txt | 435106 | download |
urls-archive.max.fan-twitter-@GovMattBevin-filtered.txt-shallow-20200712-124421-buhrg.json | 339 | download job |
urls-archive.max.fan-twitter-@GovMonaco-filtered.txt-shallow-20200712-123210-4uni4-meta.warc.gz | 207502 | download job |
urls-archive.max.fan-twitter-@GovMonaco-filtered.txt-shallow-20200712-123210-4uni4-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovNedLamont-filtered.txt-shallow-20200712-122431-d3kel-00000.warc.gz | 600116143 | download job |
urls-archive.max.fan-twitter-@GovNedLamont-filtered.txt-shallow-20200712-122431-d3kel-00000.warc.os.cdx.gz | 1127379 | download |
urls-archive.max.fan-twitter-@GovNedLamont-filtered.txt-shallow-20200712-122431-d3kel-meta.warc.gz | 609132 | download job |
urls-archive.max.fan-twitter-@GovNedLamont-filtered.txt-shallow-20200712-122431-d3kel-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovNedLamont-filtered.txt-shallow-20200712-122431-d3kel-urls.txt | 168840 | download |
urls-archive.max.fan-twitter-@GovNedLamont-filtered.txt-shallow-20200712-122431-d3kel.json | 339 | download job |
urls-archive.max.fan-twitter-@GovParsonMO-filtered.txt-shallow-20200712-122431-exz0w-00000.warc.gz | 1196657987 | download job |
urls-archive.max.fan-twitter-@GovParsonMO-filtered.txt-shallow-20200712-122431-exz0w-00000.warc.os.cdx.gz | 1479697 | download |
urls-archive.max.fan-twitter-@GovParsonMO-filtered.txt-shallow-20200712-122431-exz0w-meta.warc.gz | 791243 | download job |
urls-archive.max.fan-twitter-@GovParsonMO-filtered.txt-shallow-20200712-122431-exz0w-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovParsonMO-filtered.txt-shallow-20200712-122431-exz0w-urls.txt | 237003 | download |
urls-archive.max.fan-twitter-@GovParsonMO-filtered.txt-shallow-20200712-122431-exz0w.json | 337 | download job |
urls-archive.max.fan-twitter-@GovPritzker-filtered.txt-shallow-20200712-122428-c4j21-00000.warc.gz | 494218103 | download job |
urls-archive.max.fan-twitter-@GovPritzker-filtered.txt-shallow-20200712-122428-c4j21-00000.warc.os.cdx.gz | 1198276 | download |
urls-archive.max.fan-twitter-@GovPritzker-filtered.txt-shallow-20200712-122428-c4j21-meta.warc.gz | 640040 | download job |
urls-archive.max.fan-twitter-@GovPritzker-filtered.txt-shallow-20200712-122428-c4j21-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovPritzker-filtered.txt-shallow-20200712-122428-c4j21-urls.txt | 156704 | download |
urls-archive.max.fan-twitter-@GovPritzker-filtered.txt-shallow-20200712-122428-c4j21.json | 337 | download job |
urls-archive.max.fan-twitter-@GovRicketts-filtered.txt-shallow-20200712-122426-7odqm-00000.warc.gz | 9516017 | download job |
urls-archive.max.fan-twitter-@GovRicketts-filtered.txt-shallow-20200712-122426-7odqm-00000.warc.os.cdx.gz | 32250 | download |
urls-archive.max.fan-twitter-@GovRicketts-filtered.txt-shallow-20200712-122426-7odqm-urls.txt | 1770 | download |
urls-archive.max.fan-twitter-@GovRonDeSantis-filtered.txt-shallow-20200712-122209-39owc-00000.warc.gz | 576898109 | download job |
urls-archive.max.fan-twitter-@GovRonDeSantis-filtered.txt-shallow-20200712-122209-39owc-00000.warc.os.cdx.gz | 1680407 | download |
urls-archive.max.fan-twitter-@GovRonDeSantis-filtered.txt-shallow-20200712-122209-39owc-meta.warc.gz | 895599 | download job |
urls-archive.max.fan-twitter-@GovRonDeSantis-filtered.txt-shallow-20200712-122209-39owc-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovRonDeSantis-filtered.txt-shallow-20200712-122209-39owc-urls.txt | 203156 | download |
urls-archive.max.fan-twitter-@GovRonDeSantis-filtered.txt-shallow-20200712-122209-39owc.json | 343 | download job |
urls-archive.max.fan-twitter-@GovSisolak-filtered.txt-shallow-20200712-122047-3pjwb-00000.warc.gz | 828238376 | download job |
urls-archive.max.fan-twitter-@GovSisolak-filtered.txt-shallow-20200712-122047-3pjwb-00000.warc.os.cdx.gz | 1253282 | download |
urls-archive.max.fan-twitter-@GovSisolak-filtered.txt-shallow-20200712-122047-3pjwb-meta.warc.gz | 670117 | download job |
urls-archive.max.fan-twitter-@GovSisolak-filtered.txt-shallow-20200712-122047-3pjwb-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovSisolak-filtered.txt-shallow-20200712-122047-3pjwb-urls.txt | 165010 | download |
urls-archive.max.fan-twitter-@GovSisolak-filtered.txt-shallow-20200712-122047-3pjwb.json | 335 | download job |
urls-archive.max.fan-twitter-@GovStitt-filtered.txt-shallow-20200712-121923-bv6wv-meta.warc.gz | 395954 | download job |
urls-archive.max.fan-twitter-@GovStitt-filtered.txt-shallow-20200712-121923-bv6wv-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovStitt-filtered.txt-shallow-20200712-121923-bv6wv-urls.txt | 104935 | download |
urls-archive.max.fan-twitter-@GovStitt-filtered.txt-shallow-20200712-121923-bv6wv.json | 331 | download job |
urls-archive.max.fan-twitter-@GovTimWalz-filtered.txt-shallow-20200712-121919-69j6o-meta.warc.gz | 64926 | download job |
urls-archive.max.fan-twitter-@GovTimWalz-filtered.txt-shallow-20200712-121919-69j6o-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovTimWalz-filtered.txt-shallow-20200712-121919-69j6o-urls.txt | 5974 | download |
urls-archive.max.fan-twitter-@GovTimWalz-filtered.txt-shallow-20200712-121919-69j6o.json | 335 | download job |
urls-archive.max.fan-twitter-@GovernorBullock-filtered.txt-shallow-20200712-130345-88oi1-meta.warc.gz | 1010346 | download job |
urls-archive.max.fan-twitter-@GovernorBullock-filtered.txt-shallow-20200712-130345-88oi1-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovernorBullock-filtered.txt-shallow-20200712-130345-88oi1.json | 345 | download job |
urls-archive.max.fan-twitter-@GovernorGordon-filtered.txt-shallow-20200712-130340-34iac-00000.warc.gz | 107817119 | download job |
urls-archive.max.fan-twitter-@GovernorGordon-filtered.txt-shallow-20200712-130340-34iac-00000.warc.os.cdx.gz | 192346 | download |
urls-archive.max.fan-twitter-@GovernorGordon-filtered.txt-shallow-20200712-130340-34iac-meta.warc.gz | 106656 | download job |
urls-archive.max.fan-twitter-@GovernorGordon-filtered.txt-shallow-20200712-130340-34iac-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovernorGordon-filtered.txt-shallow-20200712-130340-34iac-urls.txt | 32426 | download |
urls-archive.max.fan-twitter-@GovernorGordon-filtered.txt-shallow-20200712-130340-34iac.json | 343 | download job |
urls-archive.max.fan-twitter-@GovernorPataki-filtered.txt-shallow-20200712-130012-3y6ws-00000.warc.gz | 217791061 | download job |
urls-archive.max.fan-twitter-@GovernorPataki-filtered.txt-shallow-20200712-130012-3y6ws-00000.warc.os.cdx.gz | 639635 | download |
urls-archive.max.fan-twitter-@GovernorPataki-filtered.txt-shallow-20200712-130012-3y6ws-meta.warc.gz | 344132 | download job |
urls-archive.max.fan-twitter-@GovernorPataki-filtered.txt-shallow-20200712-130012-3y6ws-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovernorPataki-filtered.txt-shallow-20200712-130012-3y6ws-urls.txt | 84471 | download |
urls-archive.max.fan-twitter-@GovernorPataki-filtered.txt-shallow-20200712-130012-3y6ws.json | 343 | download job |
urls-archive.max.fan-twitter-@GreatSmokyNPS-filtered.txt-shallow-20200712-121810-avjdi-urls.txt | 109804 | download |
urls-archive.max.fan-twitter-@GreenfieldIowa-filtered.txt-shallow-20200712-121805-9jg08-00000.warc.gz | 242983230 | download job |
urls-archive.max.fan-twitter-@GreenfieldIowa-filtered.txt-shallow-20200712-121805-9jg08-00000.warc.os.cdx.gz | 491456 | download |
urls-archive.max.fan-twitter-@GreenfieldIowa-filtered.txt-shallow-20200712-121805-9jg08-meta.warc.gz | 265696 | download job |
urls-archive.max.fan-twitter-@GreenfieldIowa-filtered.txt-shallow-20200712-121805-9jg08-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GuilfordNPS-filtered.txt-shallow-20200712-121122-90smz-meta.warc.gz | 38895 | download job |
urls-archive.max.fan-twitter-@GuilfordNPS-filtered.txt-shallow-20200712-121122-90smz-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GuilfordNPS-filtered.txt-shallow-20200712-121122-90smz.json | 337 | download job |
urls-archive.max.fan-twitter-@GuldenTC-filtered.txt-shallow-20200712-121118-dgz29-00000.warc.gz | 93012637 | download job |
urls-archive.max.fan-twitter-@GuldenTC-filtered.txt-shallow-20200712-121118-dgz29-00000.warc.os.cdx.gz | 146225 | download |
urls-archive.max.fan-twitter-@GuldenTC-filtered.txt-shallow-20200712-121118-dgz29-urls.txt | 26224 | download |
urls-archive.max.fan-twitter-@GuldenTC-filtered.txt-shallow-20200712-121118-dgz29.json | 331 | download job |
urls-archive.max.fan-twitter-@GulfIslandsNPS-filtered.txt-shallow-20200712-121030-78g87-00000.warc.gz | 100216187 | download job |
urls-archive.max.fan-twitter-@GulfIslandsNPS-filtered.txt-shallow-20200712-121030-78g87-00000.warc.os.cdx.gz | 118680 | download |
urls-archive.max.fan-twitter-@GulfIslandsNPS-filtered.txt-shallow-20200712-121030-78g87-meta.warc.gz | 67477 | download job |
urls-archive.max.fan-twitter-@GulfIslandsNPS-filtered.txt-shallow-20200712-121030-78g87-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GusForCongress-filtered.txt-shallow-20200712-121025-er9d8.json | 343 | download job |
urls-archive.max.fan-twitter-@GutoAberconwy-filtered.txt-shallow-20200712-121026-2a7rb-meta.warc.gz | 25194 | download job |
urls-archive.max.fan-twitter-@GutoAberconwy-filtered.txt-shallow-20200712-121026-2a7rb-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GutoAberconwy-filtered.txt-shallow-20200712-121026-2a7rb-urls.txt | 14656 | download |
urls-archive.max.fan-twitter-@GuvernulRMD-filtered.txt-shallow-20200712-121024-88ihm.json | 337 | download job |
urls-archive.max.fan-twitter-@HamdoDelic-filtered.txt-shallow-20200712-120833-7e1zj-00000.warc.gz | 1460562486 | download job |
urls-archive.max.fan-twitter-@HamdoDelic-filtered.txt-shallow-20200712-120833-7e1zj-00000.warc.os.cdx.gz | 2460506 | download |
urls-archive.max.fan-twitter-@HamdoDelic-filtered.txt-shallow-20200712-120833-7e1zj-meta.warc.gz | 1307175 | download job |
urls-archive.max.fan-twitter-@HamdoDelic-filtered.txt-shallow-20200712-120833-7e1zj-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@HamdoDelic-filtered.txt-shallow-20200712-120833-7e1zj-urls.txt | 869678 | download |
urls-archive.max.fan-twitter-@HamdoDelic-filtered.txt-shallow-20200712-120833-7e1zj.json | 335 | download job |
urls-archive.max.fan-twitter-@HarjitSajjan-filtered.txt-shallow-20200712-120621-2pacd-00000.warc.gz | 1930777532 | download job |
urls-archive.max.fan-twitter-@HarjitSajjan-filtered.txt-shallow-20200712-120621-2pacd-00000.warc.os.cdx.gz | 2440221 | download |
urls-archive.max.fan-twitter-@HarjitSajjan-filtered.txt-shallow-20200712-120621-2pacd-meta.warc.gz | 1313065 | download job |
urls-archive.max.fan-twitter-@HarjitSajjan-filtered.txt-shallow-20200712-120621-2pacd-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@HarjitSajjan-filtered.txt-shallow-20200712-120621-2pacd-urls.txt | 405865 | download |
urls-archive.max.fan-twitter-@HarjitSajjan-filtered.txt-shallow-20200712-120621-2pacd.json | 339 | download job |
urls-archive.max.fan-twitter-@HassanAmmar5-filtered.txt-shallow-20200712-120458-9op6a-meta.warc.gz | 14723 | download job |
urls-archive.max.fan-twitter-@HassanAmmar5-filtered.txt-shallow-20200712-120458-9op6a-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@HassanAmmar5-filtered.txt-shallow-20200712-120458-9op6a.json | 339 | download job |
urls-archive.max.fan-twitter-@HawleyMO-filtered.txt-shallow-20200712-120455-dngpi-meta.warc.gz | 91179 | download job |
urls-archive.max.fan-twitter-@HawleyMO-filtered.txt-shallow-20200712-120455-dngpi-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@HawleyMO-filtered.txt-shallow-20200712-120455-dngpi.json | 331 | download job |
urls-archive.max.fan-twitter-@HeForShe-filtered.txt-shallow-20200712-115614-5vy0q-00000.warc.gz | 943320441 | download job |
urls-archive.max.fan-twitter-@HeForShe-filtered.txt-shallow-20200712-115614-5vy0q-00000.warc.os.cdx.gz | 2486785 | download |
urls-archive.max.fan-twitter-@HeForShe-filtered.txt-shallow-20200712-115614-5vy0q-meta.warc.gz | 1305725 | download job |
urls-archive.max.fan-twitter-@HeForShe-filtered.txt-shallow-20200712-115614-5vy0q-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@HeForShe-filtered.txt-shallow-20200712-115614-5vy0q-urls.txt | 342411 | download |
urls-archive.max.fan-twitter-@HeForShe-filtered.txt-shallow-20200712-115614-5vy0q.json | 331 | download job |
urls-archive.max.fan-twitter-@HeadUNDRR-filtered.txt-shallow-20200712-115621-eyqba-meta.warc.gz | 136446 | download job |
urls-archive.max.fan-twitter-@HeadUNDRR-filtered.txt-shallow-20200712-115621-eyqba-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@HeadUNDRR-filtered.txt-shallow-20200712-115621-eyqba-urls.txt | 39350 | download |
urls-archive.max.fan-twitter-@HenrySternCA-filtered.txt-shallow-20200712-115121-4hzvy-meta.warc.gz | 193563 | download job |
urls-archive.max.fan-twitter-@HenrySternCA-filtered.txt-shallow-20200712-115121-4hzvy-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@HenrySternCA-filtered.txt-shallow-20200712-115121-4hzvy.json | 339 | download job |
urls-archive.max.fan-twitter-@Hickenlooper-filtered.txt-shallow-20200712-114932-361xh-00000.warc.gz | 138452776 | download job |
urls-archive.max.fan-twitter-@Hickenlooper-filtered.txt-shallow-20200712-114932-361xh-00000.warc.os.cdx.gz | 442976 | download |
urls-archive.max.fan-twitter-@Hickenlooper-filtered.txt-shallow-20200712-114932-361xh-meta.warc.gz | 239506 | download job |
urls-archive.max.fan-twitter-@Hickenlooper-filtered.txt-shallow-20200712-114932-361xh-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Hickenlooper-filtered.txt-shallow-20200712-114932-361xh.json | 339 | download job |
urls-archive.max.fan-twitter-@HonAhmedHussen-filtered.txt-shallow-20200712-113830-8rwlj-00000.warc.gz | 1600033018 | download job |
urls-archive.max.fan-twitter-@HonAhmedHussen-filtered.txt-shallow-20200712-113830-8rwlj-00000.warc.os.cdx.gz | 2115964 | download |
urls-archive.max.fan-twitter-@HonAhmedHussen-filtered.txt-shallow-20200712-113830-8rwlj-meta.warc.gz | 1138857 | download job |
urls-archive.max.fan-twitter-@HonAhmedHussen-filtered.txt-shallow-20200712-113830-8rwlj-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@HonAhmedHussen-filtered.txt-shallow-20200712-113830-8rwlj-urls.txt | 364994 | download |
urls-archive.max.fan-twitter-@HonAhmedHussen-filtered.txt-shallow-20200712-113830-8rwlj.json | 343 | download job |
urls-archive.max.fan-twitter-@IAF_MCC-filtered.txt-shallow-20200712-111413-cpcju-00000.warc.gz | 999581916 | download job |
urls-archive.max.fan-twitter-@IAF_MCC-filtered.txt-shallow-20200712-111413-cpcju-00000.warc.os.cdx.gz | 1998136 | download |
urls-archive.max.fan-twitter-@IRENA-filtered.txt-shallow-20200712-100412-1shl1-00000.warc.gz | 2548725155 | download job |
urls-archive.max.fan-twitter-@IRENA-filtered.txt-shallow-20200712-100412-1shl1-00000.warc.os.cdx.gz | 4066462 | download |
urls-archive.max.fan-twitter-@IRENA-filtered.txt-shallow-20200712-100412-1shl1-meta.warc.gz | 2174292 | download job |
urls-archive.max.fan-twitter-@IRENA-filtered.txt-shallow-20200712-100412-1shl1-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@IRENA-filtered.txt-shallow-20200712-100412-1shl1-urls.txt | 965310 | download |
urls-archive.max.fan-twitter-@IRENA-filtered.txt-shallow-20200712-100412-1shl1.json | 325 | download job |
urls-archive.max.fan-twitter-@Iam_BrookeSmith-filtered.txt-shallow-20200712-111319-a4yux-00000.warc.gz | 634870809 | download job |
urls-archive.max.fan-twitter-@Iam_BrookeSmith-filtered.txt-shallow-20200712-111319-a4yux-00000.warc.os.cdx.gz | 1142014 | download |
urls-archive.max.fan-twitter-@Iam_BrookeSmith-filtered.txt-shallow-20200712-111319-a4yux-meta.warc.gz | 605148 | download job |
urls-archive.max.fan-twitter-@Iam_BrookeSmith-filtered.txt-shallow-20200712-111319-a4yux-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Iam_BrookeSmith-filtered.txt-shallow-20200712-111319-a4yux.json | 345 | download job |
urls-archive.max.fan-twitter-@IkerCasillas-filtered.txt-shallow-20200712-105943-it30m-00000.warc.gz | 924469764 | download job |
urls-archive.max.fan-twitter-@IkerCasillas-filtered.txt-shallow-20200712-105943-it30m-00000.warc.os.cdx.gz | 2819349 | download |
urls-archive.max.fan-twitter-@IkerCasillas-filtered.txt-shallow-20200712-105943-it30m-meta.warc.gz | 1480869 | download job |
urls-archive.max.fan-twitter-@IkerCasillas-filtered.txt-shallow-20200712-105943-it30m-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@IkerCasillas-filtered.txt-shallow-20200712-105943-it30m-urls.txt | 239628 | download |
urls-archive.max.fan-twitter-@IkerCasillas-filtered.txt-shallow-20200712-105943-it30m.json | 339 | download job |
urls-archive.max.fan-twitter-@IndyMayorJoe-filtered.txt-shallow-20200712-102115-60jx3-00000.warc.gz | 2794212954 | download job |
urls-archive.max.fan-twitter-@IndyMayorJoe-filtered.txt-shallow-20200712-102115-60jx3-00000.warc.os.cdx.gz | 2216035 | download |
urls-archive.max.fan-twitter-@IndyMayorJoe-filtered.txt-shallow-20200712-102115-60jx3-meta.warc.gz | 1154469 | download job |
urls-archive.max.fan-twitter-@IndyMayorJoe-filtered.txt-shallow-20200712-102115-60jx3-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@IndyMayorJoe-filtered.txt-shallow-20200712-102115-60jx3-urls.txt | 458954 | download |
urls-archive.max.fan-twitter-@fininquiry-filtered.txt-shallow-20200712-144856-2cx7l-00000.warc.gz | 97463477 | download job |
urls-archive.max.fan-twitter-@fininquiry-filtered.txt-shallow-20200712-144856-2cx7l-00000.warc.os.cdx.gz | 138379 | download |
urls-archive.max.fan-twitter-@fininquiry-filtered.txt-shallow-20200712-144856-2cx7l-meta.warc.gz | 77969 | download job |
urls-archive.max.fan-twitter-@fininquiry-filtered.txt-shallow-20200712-144856-2cx7l-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@fininquiry-filtered.txt-shallow-20200712-144856-2cx7l-urls.txt | 49490 | download |
urls-archive.max.fan-twitter-@fininquiry-filtered.txt-shallow-20200712-144856-2cx7l.json | 335 | download job |
urls-archive.max.fan-twitter-@flynnkaNYT-filtered.txt-shallow-20200712-143319-96f0p-00000.warc.gz | 122340307 | download job |
urls-archive.max.fan-twitter-@flynnkaNYT-filtered.txt-shallow-20200712-143319-96f0p-00000.warc.os.cdx.gz | 168735 | download |
urls-archive.max.fan-twitter-@flynnkaNYT-filtered.txt-shallow-20200712-143319-96f0p-urls.txt | 86468 | download |
urls-archive.max.fan-twitter-@flynnkaNYT-filtered.txt-shallow-20200712-143319-96f0p.json | 335 | download job |
urls-archive.max.fan-twitter-@franniemkoba-filtered.txt-shallow-20200712-141754-204uq-00000.warc.gz | 11848451 | download job |
urls-archive.max.fan-twitter-@franniemkoba-filtered.txt-shallow-20200712-141754-204uq-00000.warc.os.cdx.gz | 19104 | download |
urls-archive.max.fan-twitter-@franniemkoba-filtered.txt-shallow-20200712-141754-204uq-meta.warc.gz | 14643 | download job |
urls-archive.max.fan-twitter-@franniemkoba-filtered.txt-shallow-20200712-141754-204uq-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@franniemkoba-filtered.txt-shallow-20200712-141754-204uq-urls.txt | 6313 | download |
urls-archive.max.fan-twitter-@fu_claire-filtered.txt-shallow-20200712-141245-d8vhc-00000.warc.gz | 13278112 | download job |
urls-archive.max.fan-twitter-@fu_claire-filtered.txt-shallow-20200712-141245-d8vhc-00000.warc.os.cdx.gz | 28497 | download |
urls-archive.max.fan-twitter-@fu_claire-filtered.txt-shallow-20200712-141245-d8vhc-meta.warc.gz | 19539 | download job |
urls-archive.max.fan-twitter-@fu_claire-filtered.txt-shallow-20200712-141245-d8vhc-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@fu_claire-filtered.txt-shallow-20200712-141245-d8vhc-urls.txt | 5461 | download |
urls-archive.max.fan-twitter-@fu_claire-filtered.txt-shallow-20200712-141245-d8vhc.json | 333 | download job |
urls-archive.max.fan-twitter-@gabriellaangojo-filtered.txt-shallow-20200712-141242-zhqht-00000.warc.gz | 57116871 | download job |
urls-archive.max.fan-twitter-@gabriellaangojo-filtered.txt-shallow-20200712-141242-zhqht-00000.warc.os.cdx.gz | 74669 | download |
urls-archive.max.fan-twitter-@gabriellaangojo-filtered.txt-shallow-20200712-141242-zhqht-meta.warc.gz | 44547 | download job |
urls-archive.max.fan-twitter-@gabriellaangojo-filtered.txt-shallow-20200712-141242-zhqht-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@gabriellaangojo-filtered.txt-shallow-20200712-141242-zhqht.json | 345 | download job |
urls-archive.max.fan-twitter-@galendruke-filtered.txt-shallow-20200712-140754-3t1yj-00000.warc.gz | 383581027 | download job |
urls-archive.max.fan-twitter-@galendruke-filtered.txt-shallow-20200712-140754-3t1yj-00000.warc.os.cdx.gz | 963458 | download |
urls-archive.max.fan-twitter-@galendruke-filtered.txt-shallow-20200712-140754-3t1yj-meta.warc.gz | 523242 | download job |
urls-archive.max.fan-twitter-@galendruke-filtered.txt-shallow-20200712-140754-3t1yj-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@galendruke-filtered.txt-shallow-20200712-140754-3t1yj-urls.txt | 173489 | download |
urls-archive.max.fan-twitter-@galendruke-filtered.txt-shallow-20200712-140754-3t1yj.json | 335 | download job |
urls-archive.max.fan-twitter-@garcia_alexndra-filtered.txt-shallow-20200712-140753-1a7fu-00000.warc.gz | 52540380 | download job |
urls-archive.max.fan-twitter-@garcia_alexndra-filtered.txt-shallow-20200712-140753-1a7fu-00000.warc.os.cdx.gz | 106327 | download |
urls-archive.max.fan-twitter-@garcia_alexndra-filtered.txt-shallow-20200712-140753-1a7fu-meta.warc.gz | 61520 | download job |
urls-archive.max.fan-twitter-@garcia_alexndra-filtered.txt-shallow-20200712-140753-1a7fu-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@garcia_alexndra-filtered.txt-shallow-20200712-140753-1a7fu-urls.txt | 46999 | download |
urls-archive.max.fan-twitter-@garcia_alexndra-filtered.txt-shallow-20200712-140753-1a7fu.json | 345 | download job |
urls-archive.max.fan-twitter-@geoffmulvihill-filtered.txt-shallow-20200712-135509-3lb4y-00000.warc.gz | 46246513 | download job |
urls-archive.max.fan-twitter-@geoffmulvihill-filtered.txt-shallow-20200712-135509-3lb4y-00000.warc.os.cdx.gz | 71500 | download |
urls-archive.max.fan-twitter-@geoffmulvihill-filtered.txt-shallow-20200712-135509-3lb4y-meta.warc.gz | 42375 | download job |
urls-archive.max.fan-twitter-@geoffmulvihill-filtered.txt-shallow-20200712-135509-3lb4y-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@geoffmulvihill-filtered.txt-shallow-20200712-135509-3lb4y-urls.txt | 39012 | download |
urls-archive.max.fan-twitter-@geoffmulvihill-filtered.txt-shallow-20200712-135509-3lb4y.json | 343 | download job |
urls-archive.max.fan-twitter-@georgehenryAP-filtered.txt-shallow-20200712-135309-qdwzs-00000.warc.gz | 83142910 | download job |
urls-archive.max.fan-twitter-@georgehenryAP-filtered.txt-shallow-20200712-135309-qdwzs-00000.warc.os.cdx.gz | 111800 | download |
urls-archive.max.fan-twitter-@georgehenryAP-filtered.txt-shallow-20200712-135309-qdwzs-meta.warc.gz | 63904 | download job |
urls-archive.max.fan-twitter-@georgehenryAP-filtered.txt-shallow-20200712-135309-qdwzs-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@georgehenryAP-filtered.txt-shallow-20200712-135309-qdwzs-urls.txt | 71529 | download |
urls-archive.max.fan-twitter-@georgehenryAP-filtered.txt-shallow-20200712-135309-qdwzs.json | 341 | download job |
urls-archive.max.fan-twitter-@gerrymandr-filtered.txt-shallow-20200712-135308-ci18a-00000.warc.gz | 11837364 | download job |
urls-archive.max.fan-twitter-@gerrymandr-filtered.txt-shallow-20200712-135308-ci18a-00000.warc.os.cdx.gz | 26574 | download |
urls-archive.max.fan-twitter-@gerrymandr-filtered.txt-shallow-20200712-135308-ci18a-meta.warc.gz | 18641 | download job |
urls-archive.max.fan-twitter-@gerrymandr-filtered.txt-shallow-20200712-135308-ci18a-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@gerrymandr-filtered.txt-shallow-20200712-135308-ci18a-urls.txt | 7699 | download |
urls-archive.max.fan-twitter-@gerrymandr-filtered.txt-shallow-20200712-135308-ci18a.json | 335 | download job |
urls-archive.max.fan-twitter-@gflaccus-filtered.txt-shallow-20200712-135305-3eaae-00000.warc.gz | 137003095 | download job |
urls-archive.max.fan-twitter-@gflaccus-filtered.txt-shallow-20200712-135305-3eaae-00000.warc.os.cdx.gz | 183944 | download |
urls-archive.max.fan-twitter-@gflaccus-filtered.txt-shallow-20200712-135305-3eaae-meta.warc.gz | 101578 | download job |
urls-archive.max.fan-twitter-@gflaccus-filtered.txt-shallow-20200712-135305-3eaae-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@gflaccus-filtered.txt-shallow-20200712-135305-3eaae.json | 331 | download job |
urls-archive.max.fan-twitter-@gillianwong-filtered.txt-shallow-20200712-134806-b3sdc-00000.warc.gz | 335952952 | download job |
urls-archive.max.fan-twitter-@gillianwong-filtered.txt-shallow-20200712-134806-b3sdc-00000.warc.os.cdx.gz | 695264 | download |
urls-archive.max.fan-twitter-@gillianwong-filtered.txt-shallow-20200712-134806-b3sdc-meta.warc.gz | 372823 | download job |
urls-archive.max.fan-twitter-@gillianwong-filtered.txt-shallow-20200712-134806-b3sdc-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@gillianwong-filtered.txt-shallow-20200712-134806-b3sdc-urls.txt | 240699 | download |
urls-archive.max.fan-twitter-@gillianwong-filtered.txt-shallow-20200712-134806-b3sdc.json | 337 | download job |
urls-archive.max.fan-twitter-@gillibrandny-filtered.txt-shallow-20200712-134801-3u02t-00000.warc.gz | 34821923 | download job |
urls-archive.max.fan-twitter-@gillibrandny-filtered.txt-shallow-20200712-134801-3u02t-00000.warc.os.cdx.gz | 96704 | download |
urls-archive.max.fan-twitter-@gillibrandny-filtered.txt-shallow-20200712-134801-3u02t-meta.warc.gz | 55576 | download job |
urls-archive.max.fan-twitter-@gillibrandny-filtered.txt-shallow-20200712-134801-3u02t-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@gillibrandny-filtered.txt-shallow-20200712-134801-3u02t-urls.txt | 10620 | download |
urls-archive.max.fan-twitter-@gillibrandny-filtered.txt-shallow-20200712-134801-3u02t.json | 339 | download job |
urls-archive.max.fan-twitter-@gitadaneshjoo-filtered.txt-shallow-20200712-133712-bewv3-00000.warc.gz | 4704065 | download job |
urls-archive.max.fan-twitter-@gitadaneshjoo-filtered.txt-shallow-20200712-133712-bewv3-00000.warc.os.cdx.gz | 7644 | download |
urls-archive.max.fan-twitter-@gitadaneshjoo-filtered.txt-shallow-20200712-133712-bewv3-meta.warc.gz | 8221 | download job |
urls-archive.max.fan-twitter-@gitadaneshjoo-filtered.txt-shallow-20200712-133712-bewv3-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@gitadaneshjoo-filtered.txt-shallow-20200712-133712-bewv3-urls.txt | 2050 | download |
urls-archive.max.fan-twitter-@gitadaneshjoo-filtered.txt-shallow-20200712-133712-bewv3.json | 341 | download job |
urls-archive.max.fan-twitter-@giveawayindia-filtered.txt-shallow-20200712-133711-cmxxi-00000.warc.gz | 49948552 | download job |
urls-archive.max.fan-twitter-@giveawayindia-filtered.txt-shallow-20200712-133711-cmxxi-00000.warc.os.cdx.gz | 55848 | download |
urls-archive.max.fan-twitter-@giveawayindia-filtered.txt-shallow-20200712-133711-cmxxi-meta.warc.gz | 34055 | download job |
urls-archive.max.fan-twitter-@giveawayindia-filtered.txt-shallow-20200712-133711-cmxxi-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@giveawayindia-filtered.txt-shallow-20200712-133711-cmxxi-urls.txt | 18412 | download |
urls-archive.max.fan-twitter-@giveawayindia-filtered.txt-shallow-20200712-133711-cmxxi.json | 341 | download job |
urls-archive.max.fan-twitter-@globalnyc-filtered.txt-shallow-20200712-132832-1ycz4-urls.txt | 307426 | download |
urls-archive.max.fan-twitter-@globalnyc-filtered.txt-shallow-20200712-132832-1ycz4.json | 333 | download job |
urls-archive.max.fan-twitter-@goChoate-filtered.txt-shallow-20200712-132828-crpek-00000.warc.gz | 2050657 | download job |
urls-archive.max.fan-twitter-@goChoate-filtered.txt-shallow-20200712-132828-crpek-00000.warc.os.cdx.gz | 4858 | download |
urls-archive.max.fan-twitter-@goChoate-filtered.txt-shallow-20200712-132828-crpek-meta.warc.gz | 6556 | download job |
urls-archive.max.fan-twitter-@goChoate-filtered.txt-shallow-20200712-132828-crpek-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@goChoate-filtered.txt-shallow-20200712-132828-crpek-urls.txt | 112 | download |
urls-archive.max.fan-twitter-@goChoate-filtered.txt-shallow-20200712-132828-crpek.json | 331 | download job |
urls-archive.max.fan-twitter-@goonj-filtered.txt-shallow-20200712-132827-9t77k-00000.warc.gz | 856912931 | download job |
urls-archive.max.fan-twitter-@goonj-filtered.txt-shallow-20200712-132827-9t77k-00000.warc.os.cdx.gz | 1032624 | download |
urls-archive.max.fan-twitter-@goonj-filtered.txt-shallow-20200712-132827-9t77k-urls.txt | 212829 | download |
urls-archive.max.fan-twitter-@goonj-filtered.txt-shallow-20200712-132827-9t77k.json | 325 | download job |
urls-archive.max.fan-twitter-@gophawaii-filtered.txt-shallow-20200712-132350-cougp-00000.warc.gz | 231131070 | download job |
urls-archive.max.fan-twitter-@gophawaii-filtered.txt-shallow-20200712-132350-cougp-00000.warc.os.cdx.gz | 250561 | download |
urls-archive.max.fan-twitter-@gophawaii-filtered.txt-shallow-20200712-132350-cougp-meta.warc.gz | 134944 | download job |
urls-archive.max.fan-twitter-@gophawaii-filtered.txt-shallow-20200712-132350-cougp-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@gophawaii-filtered.txt-shallow-20200712-132350-cougp-urls.txt | 168341 | download |
urls-archive.max.fan-twitter-@gophawaii-filtered.txt-shallow-20200712-132350-cougp.json | 333 | download job |
urls-archive.max.fan-twitter-@gouv_lu-filtered.txt-shallow-20200712-132219-21ewi-00000.warc.gz | 129271291 | download job |
urls-archive.max.fan-twitter-@gouv_lu-filtered.txt-shallow-20200712-132219-21ewi-00000.warc.os.cdx.gz | 149466 | download |
urls-archive.max.fan-twitter-@gouv_lu-filtered.txt-shallow-20200712-132219-21ewi-meta.warc.gz | 83886 | download job |
urls-archive.max.fan-twitter-@gouv_lu-filtered.txt-shallow-20200712-132219-21ewi-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@gouv_lu-filtered.txt-shallow-20200712-132219-21ewi-urls.txt | 45058 | download |
urls-archive.max.fan-twitter-@gouv_lu-filtered.txt-shallow-20200712-132219-21ewi.json | 329 | download job |
urls-archive.max.fan-twitter-@gouvernementFR-filtered.txt-shallow-20200712-132220-a4q18-00000.warc.gz | 103683352 | download job |
urls-archive.max.fan-twitter-@gouvernementFR-filtered.txt-shallow-20200712-132220-a4q18-00000.warc.os.cdx.gz | 356133 | download |
urls-archive.max.fan-twitter-@gouvernementFR-filtered.txt-shallow-20200712-132220-a4q18-meta.warc.gz | 192815 | download job |
urls-archive.max.fan-twitter-@gouvernementFR-filtered.txt-shallow-20200712-132220-a4q18-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@gouvernementFR-filtered.txt-shallow-20200712-132220-a4q18-urls.txt | 29884 | download |
urls-archive.max.fan-twitter-@gouvernementFR-filtered.txt-shallow-20200712-132220-a4q18.json | 343 | download job |
urls-archive.max.fan-twitter-@govbryan-filtered.txt-shallow-20200712-131221-bamu4-00000.warc.gz | 19597608 | download job |
urls-archive.max.fan-twitter-@govbryan-filtered.txt-shallow-20200712-131221-bamu4-00000.warc.os.cdx.gz | 33499 | download |
urls-archive.max.fan-twitter-@govbryan-filtered.txt-shallow-20200712-131221-bamu4-meta.warc.gz | 22159 | download job |
urls-archive.max.fan-twitter-@govbryan-filtered.txt-shallow-20200712-131221-bamu4-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@govbryan-filtered.txt-shallow-20200712-131221-bamu4-urls.txt | 4312 | download |
urls-archive.max.fan-twitter-@govbryan-filtered.txt-shallow-20200712-131221-bamu4.json | 331 | download job |
urls-archive.max.fan-twitter-@grace4congress-filtered.txt-shallow-20200712-121810-9xbqs-00000.warc.gz | 9870493 | download job |
urls-archive.max.fan-twitter-@grace4congress-filtered.txt-shallow-20200712-121810-9xbqs-00000.warc.os.cdx.gz | 17803 | download |
urls-archive.max.fan-twitter-@grace4congress-filtered.txt-shallow-20200712-121810-9xbqs-urls.txt | 6771 | download |
urls-archive.max.fan-twitter-@greg_rastoul-filtered.txt-shallow-20200712-121645-5a0hq-00000.warc.gz | 10392008 | download job |
urls-archive.max.fan-twitter-@greg_rastoul-filtered.txt-shallow-20200712-121645-5a0hq-00000.warc.os.cdx.gz | 18038 | download |
urls-archive.max.fan-twitter-@greg_rastoul-filtered.txt-shallow-20200712-121645-5a0hq-meta.warc.gz | 14060 | download job |
urls-archive.max.fan-twitter-@greg_rastoul-filtered.txt-shallow-20200712-121645-5a0hq-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@gretchenwhitmer-filtered.txt-shallow-20200712-121644-736ds-00000.warc.gz | 22262869 | download job |
urls-archive.max.fan-twitter-@gretchenwhitmer-filtered.txt-shallow-20200712-121644-736ds-00000.warc.os.cdx.gz | 93641 | download |
urls-archive.max.fan-twitter-@gretchenwhitmer-filtered.txt-shallow-20200712-121644-736ds.json | 345 | download job |
urls-archive.max.fan-twitter-@gwfost-filtered.txt-shallow-20200712-120839-98o1t-urls.txt | 62354 | download |
urls-archive.max.fan-twitter-@haeyoun-filtered.txt-shallow-20200712-120838-9bt6z-urls.txt | 4056 | download |
urls-archive.max.fan-twitter-@hani_mohamd-filtered.txt-shallow-20200712-120622-b0zvq-00000.warc.gz | 3299974 | download job |
urls-archive.max.fan-twitter-@hani_mohamd-filtered.txt-shallow-20200712-120622-b0zvq-00000.warc.os.cdx.gz | 7553 | download |
urls-archive.max.fan-twitter-@heislerphoto-filtered.txt-shallow-20200712-115452-e0wsl-00000.warc.gz | 76988083 | download job |
urls-archive.max.fan-twitter-@heislerphoto-filtered.txt-shallow-20200712-115452-e0wsl-00000.warc.os.cdx.gz | 178117 | download |
urls-archive.max.fan-twitter-@heislerphoto-filtered.txt-shallow-20200712-115452-e0wsl.json | 339 | download job |
urls-archive.max.fan-twitter-@henryfountain-filtered.txt-shallow-20200712-115123-2j36z-urls.txt | 211459 | download |
urls-archive.max.fan-twitter-@herbertnyt-filtered.txt-shallow-20200712-115120-erfnj-urls.txt | 149483 | download |
urls-archive.max.fan-twitter-@hkpoliceforce-filtered.txt-shallow-20200712-114318-86hbg-urls.txt | 161650 | download |
urls-archive.max.fan-twitter-@hkpoliceforce-filtered.txt-shallow-20200712-114318-86hbg.json | 341 | download job |
urls-archive.max.fan-twitter-@indiannavy-filtered.txt-shallow-20200712-102836-j3xjr-meta.warc.gz | 1484210 | download job |
urls-archive.max.fan-twitter-@indiannavy-filtered.txt-shallow-20200712-102836-j3xjr-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@jmartNYT-filtered.txt-shallow-20200712-065936-2zsdu-00000.warc.gz | 5368748932 | download job |
urls-archive.max.fan-twitter-@jmartNYT-filtered.txt-shallow-20200712-065936-2zsdu-00000.warc.os.cdx.gz | 7323983 | download |
urls-archive.max.fan-twitter-@jmartNYT-filtered.txt-shallow-20200712-065936-2zsdu-00001.warc.gz | 980811359 | download job |
urls-archive.max.fan-twitter-@jmartNYT-filtered.txt-shallow-20200712-065936-2zsdu-00001.warc.os.cdx.gz | 5957642 | download |
urls-archive.max.fan-twitter-@jmartNYT-filtered.txt-shallow-20200712-065936-2zsdu-meta.warc.gz | 6977103 | download job |
urls-archive.max.fan-twitter-@jmartNYT-filtered.txt-shallow-20200712-065936-2zsdu-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@jmartNYT-filtered.txt-shallow-20200712-065936-2zsdu-urls.txt | 4268685 | download |
urls-archive.max.fan-twitter-@jmartNYT-filtered.txt-shallow-20200712-065936-2zsdu.json | 331 | download job |
urls-transfer.notkiska.pw-twitter-%23BlackHistoryMonth-shallow-20200610-132545-46qdq-00205.warc.gz | 5447125709 | download job |
urls-transfer.notkiska.pw-twitter-%23BlackHistoryMonth-shallow-20200610-132545-46qdq-00205.warc.os.cdx.gz | 1265853 | download |
urls-transfer.notkiska.pw-twitter-%23BlackHistoryMonth-shallow-20200610-132545-46qdq-00206.warc.gz | 5584224618 | download job |
urls-transfer.notkiska.pw-twitter-%23BlackHistoryMonth-shallow-20200610-132545-46qdq-00206.warc.os.cdx.gz | 10042 | download |
urls-transfer.notkiska.pw-twitter-%23BlackHistoryMonth-shallow-20200610-132545-46qdq-00207.warc.gz | 5396534949 | download job |
urls-transfer.notkiska.pw-twitter-%23BlackHistoryMonth-shallow-20200610-132545-46qdq-00207.warc.os.cdx.gz | 16573 | download |
urls-transfer.notkiska.pw-twitter-%23BlackHistoryMonth-shallow-20200610-132545-46qdq-00208.warc.gz | 5709633277 | download job |
urls-transfer.notkiska.pw-twitter-%23BlackHistoryMonth-shallow-20200610-132545-46qdq-00208.warc.os.cdx.gz | 13199 | download |
urls-transfer.notkiska.pw-twitter-%23BlackHistoryMonth-shallow-20200610-132545-46qdq-00209.warc.gz | 5407521800 | download job |
urls-transfer.notkiska.pw-twitter-%23BlackHistoryMonth-shallow-20200610-132545-46qdq-00209.warc.os.cdx.gz | 11184 | download |
urls-transfer.notkiska.pw-twitter-%23notmypresident-shallow-20200530-220957-2c0z0-00127.warc.gz | 5415011958 | download job |
urls-transfer.notkiska.pw-twitter-%23notmypresident-shallow-20200530-220957-2c0z0-00127.warc.os.cdx.gz | 1909935 | download |
urls-transfer.notkiska.pw-twitter-%23notmypresident-shallow-20200530-220957-2c0z0-00128.warc.gz | 5473335568 | download job |
urls-transfer.notkiska.pw-twitter-%23notmypresident-shallow-20200530-220957-2c0z0-00128.warc.os.cdx.gz | 2162029 | download |
urls-transfer.notkiska.pw-twitter-%23qanon-shallow-20200531-053932-8yw79-00077.warc.gz | 5369777558 | download job |
urls-transfer.notkiska.pw-twitter-%23qanon-shallow-20200531-053932-8yw79-00077.warc.os.cdx.gz | 2646096 | download |
urls-transfer.notkiska.pw-vote-usa_org-twitter-accounts-outlinks.1.txt-shallow-20200609-230435-7k4tj-00080.warc.gz | 5369490481 | download job |
urls-transfer.notkiska.pw-vote-usa_org-twitter-accounts-outlinks.1.txt-shallow-20200609-230435-7k4tj-00080.warc.os.cdx.gz | 492557 | download |
urls-transfer.notkiska.pw-vote-usa_org-twitter-accounts-outlinks.1.txt-shallow-20200609-230435-7k4tj-00081.warc.gz | 5395262139 | download job |
urls-transfer.notkiska.pw-vote-usa_org-twitter-accounts-outlinks.1.txt-shallow-20200609-230435-7k4tj-00081.warc.os.cdx.gz | 537160 | download |
www.mathway.com-inf-20200610-011458-6sruz-00022.warc.gz | 5368711928 | download job |
www.mathway.com-inf-20200610-011458-6sruz-00022.warc.os.cdx.gz | 21394225 | download |
www.mudcrutch.com-inf-20200710-231811-ablr0-00006.warc.gz | 6232966123 | download job |
www.mudcrutch.com-inf-20200710-231811-ablr0-00006.warc.os.cdx.gz | 203524 | download |
www.mudcrutch.com-inf-20200710-231811-ablr0-00007.warc.gz | 5426757287 | download job |
www.mudcrutch.com-inf-20200710-231811-ablr0-00007.warc.os.cdx.gz | 522387 | download |
www.notcot.com-inf-20200709-213423-116f3-00021.warc.gz | 5370482185 | download job |
www.notcot.com-inf-20200709-213423-116f3-00021.warc.os.cdx.gz | 2931267 | download |
www.qiagen.com-inf-20200621-061202-1wax4-00027.warc.gz | 5369661260 | download job |
www.qiagen.com-inf-20200621-061202-1wax4-00027.warc.os.cdx.gz | 3740234 | download |
www.raspberrypi.org-inf-20200707-192424-bv6p7-00029.warc.gz | 5369159295 | download job |
www.raspberrypi.org-inf-20200707-192424-bv6p7-00029.warc.os.cdx.gz | 2111874 | download |