Item archiveteam_archivebot_go_20200712180003
Filename | Size | |
---|---|---|
archive.max.fan-shallow-20200712-174408-c5tot.json | 313 | download job |
archiveteam_archivebot_go_20200712180003.cdx.gz | 133772214 | download |
archiveteam_archivebot_go_20200712180003.cdx.idx | 113960 | download |
archiveteam_archivebot_go_20200712180003_files.xml | 0 | download |
archiveteam_archivebot_go_20200712180003_meta.sqlite | 871424 | download |
archiveteam_archivebot_go_20200712180003_meta.xml | 969 | download |
dyverscampaign.blogspot.com-inf-20200711-230125-6y293-00002.warc.gz | 1181154501 | download job |
dyverscampaign.blogspot.com-inf-20200711-230125-6y293-00002.warc.os.cdx.gz | 1104170 | download |
dyverscampaign.blogspot.com-inf-20200711-230125-6y293-meta.warc.gz | 6630760 | download job |
dyverscampaign.blogspot.com-inf-20200711-230125-6y293-meta.warc.os.cdx.gz | 47 | download |
dyverscampaign.blogspot.com-inf-20200711-230125-6y293.json | 252 | download job |
jabberworld.info-inf-20200710-221357-8fkir-00000.warc.gz | 2743598960 | download job |
jabberworld.info-inf-20200710-221357-8fkir-00000.warc.os.cdx.gz | 6332363 | download |
jabberworld.info-inf-20200710-221357-8fkir-meta.warc.gz | 5880438 | download job |
jabberworld.info-inf-20200710-221357-8fkir-meta.warc.os.cdx.gz | 47 | download |
jabberworld.info-inf-20200710-221357-8fkir.json | 240 | download job |
listserv.uoguelph.ca-inf-20200703-132747-21hfh-00008.warc.gz | 5368721237 | download job |
listserv.uoguelph.ca-inf-20200703-132747-21hfh-00008.warc.os.cdx.gz | 9684989 | download |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00134.warc.gz | 5639538525 | download job |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00134.warc.os.cdx.gz | 139939 | download |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00135.warc.gz | 6124406470 | download job |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00135.warc.os.cdx.gz | 6820 | download |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00136.warc.gz | 5522990578 | download job |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00136.warc.os.cdx.gz | 18331 | download |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00138.warc.gz | 5369910775 | download job |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00138.warc.os.cdx.gz | 22495 | download |
ninjamountain.blogspot.com-inf-20200712-073150-8n97d.json | 251 | download job |
old.reddit.com-inf-20200712-011858-coxzo-00008.warc.gz | 5612581219 | download job |
old.reddit.com-inf-20200712-011858-coxzo-00008.warc.os.cdx.gz | 321868 | download |
old.reddit.com-inf-20200712-011858-coxzo-00009.warc.gz | 5895462370 | download job |
old.reddit.com-inf-20200712-011858-coxzo-00009.warc.os.cdx.gz | 57956 | download |
old.reddit.com-inf-20200712-011858-coxzo-meta.warc.gz | 11109044 | download job |
old.reddit.com-inf-20200712-011858-coxzo-meta.warc.os.cdx.gz | 47 | download |
player.fm-inf-20200501-233943-6recr-00688.warc.gz | 5464868530 | download job |
player.fm-inf-20200501-233943-6recr-00688.warc.os.cdx.gz | 505565 | download |
up.frubar.net-shallow-20200712-154223-4e7xt-00000.warc.gz | 120681 | download job |
up.frubar.net-shallow-20200712-154223-4e7xt-00000.warc.os.cdx.gz | 233 | download |
up.frubar.net-shallow-20200712-154223-4e7xt-meta.warc.gz | 3471 | download job |
up.frubar.net-shallow-20200712-154223-4e7xt-meta.warc.os.cdx.gz | 47 | download |
up.frubar.net-shallow-20200712-154223-4e7xt.json | 265 | download job |
urls-archive.max.fan-twitter-@CRHFootball-filtered.txt-shallow-20200712-173006-2mkej-urls.txt | 354 | download |
urls-archive.max.fan-twitter-@CRHFootball-filtered.txt-shallow-20200712-173006-2mkej.json | 337 | download job |
urls-archive.max.fan-twitter-@CRefugeeCouncil-filtered.txt-shallow-20200712-173010-amfh0-meta.warc.gz | 23626 | download job |
urls-archive.max.fan-twitter-@CRefugeeCouncil-filtered.txt-shallow-20200712-173010-amfh0-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@CVNPmtb-filtered.txt-shallow-20200712-171830-7704o-meta.warc.gz | 60179 | download job |
urls-archive.max.fan-twitter-@CVNPmtb-filtered.txt-shallow-20200712-171830-7704o-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@CVNPmtb-filtered.txt-shallow-20200712-171830-7704o-urls.txt | 51674 | download |
urls-archive.max.fan-twitter-@CVNPmtb-filtered.txt-shallow-20200712-171830-7704o.json | 329 | download job |
urls-archive.max.fan-twitter-@ColumbusGov-filtered.txt-shallow-20200712-174931-58aix-00000.warc.gz | 8974074 | download job |
urls-archive.max.fan-twitter-@ColumbusGov-filtered.txt-shallow-20200712-174931-58aix-00000.warc.os.cdx.gz | 32392 | download |
urls-archive.max.fan-twitter-@ColumbusGov-filtered.txt-shallow-20200712-174931-58aix-meta.warc.gz | 21458 | download job |
urls-archive.max.fan-twitter-@ColumbusGov-filtered.txt-shallow-20200712-174931-58aix-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@CongressmanHice-filtered.txt-shallow-20200712-174810-69zzt-00000.warc.gz | 5194737 | download job |
urls-archive.max.fan-twitter-@CongressmanHice-filtered.txt-shallow-20200712-174810-69zzt-00000.warc.os.cdx.gz | 22880 | download |
urls-archive.max.fan-twitter-@CongressmanHice-filtered.txt-shallow-20200712-174810-69zzt.json | 345 | download job |
urls-archive.max.fan-twitter-@CongressmanJVD-filtered.txt-shallow-20200712-174803-84njj-00000.warc.gz | 2612821 | download job |
urls-archive.max.fan-twitter-@CongressmanJVD-filtered.txt-shallow-20200712-174803-84njj-00000.warc.os.cdx.gz | 10137 | download |
urls-archive.max.fan-twitter-@CongressmanJVD-filtered.txt-shallow-20200712-174803-84njj-urls.txt | 310 | download |
urls-archive.max.fan-twitter-@CotedivoireOnu-filtered.txt-shallow-20200712-174012-2tyzh-meta.warc.gz | 70446 | download job |
urls-archive.max.fan-twitter-@CotedivoireOnu-filtered.txt-shallow-20200712-174012-2tyzh-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@CotedivoireOnu-filtered.txt-shallow-20200712-174012-2tyzh-urls.txt | 28494 | download |
urls-archive.max.fan-twitter-@CountyofButte-filtered.txt-shallow-20200712-173528-axiu4-00000.warc.gz | 232233148 | download job |
urls-archive.max.fan-twitter-@CountyofButte-filtered.txt-shallow-20200712-173528-axiu4-00000.warc.os.cdx.gz | 362551 | download |
urls-archive.max.fan-twitter-@Crystalpearlco-filtered.txt-shallow-20200712-172441-5vb1v-meta.warc.gz | 52197 | download job |
urls-archive.max.fan-twitter-@Crystalpearlco-filtered.txt-shallow-20200712-172441-5vb1v-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Crystalpearlco-filtered.txt-shallow-20200712-172441-5vb1v.json | 343 | download job |
urls-archive.max.fan-twitter-@CzechMFA-filtered.txt-shallow-20200712-171823-2fx71-urls.txt | 76378 | download |
urls-archive.max.fan-twitter-@DCLegalHackers-filtered.txt-shallow-20200712-170348-aszyz-meta.warc.gz | 80928 | download job |
urls-archive.max.fan-twitter-@DCLegalHackers-filtered.txt-shallow-20200712-170348-aszyz-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@DCLegalHackers-filtered.txt-shallow-20200712-170348-aszyz-urls.txt | 59707 | download |
urls-archive.max.fan-twitter-@DCLegalHackers-filtered.txt-shallow-20200712-170348-aszyz.json | 343 | download job |
urls-archive.max.fan-twitter-@DFATVic-filtered.txt-shallow-20200712-165359-30bxe-00000.warc.gz | 121167332 | download job |
urls-archive.max.fan-twitter-@DFATVic-filtered.txt-shallow-20200712-165359-30bxe-00000.warc.os.cdx.gz | 122595 | download |
urls-archive.max.fan-twitter-@DHS_Wolf-filtered.txt-shallow-20200712-165111-dtw1p-urls.txt | 28896 | download |
urls-archive.max.fan-twitter-@DHS_Wolf-filtered.txt-shallow-20200712-165111-dtw1p.json | 331 | download job |
urls-archive.max.fan-twitter-@DLeBlancNB-filtered.txt-shallow-20200712-162937-7fbpr-00000.warc.gz | 265417761 | download job |
urls-archive.max.fan-twitter-@DLeBlancNB-filtered.txt-shallow-20200712-162937-7fbpr-00000.warc.os.cdx.gz | 370050 | download |
urls-archive.max.fan-twitter-@DLeBlancNB-filtered.txt-shallow-20200712-162937-7fbpr-meta.warc.gz | 204110 | download job |
urls-archive.max.fan-twitter-@DLeBlancNB-filtered.txt-shallow-20200712-162937-7fbpr-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@DLeBlancNB-filtered.txt-shallow-20200712-162937-7fbpr-urls.txt | 79063 | download |
urls-archive.max.fan-twitter-@DLeBlancNB-filtered.txt-shallow-20200712-162937-7fbpr.json | 335 | download job |
urls-archive.max.fan-twitter-@DMercer00-filtered.txt-shallow-20200712-162927-9dild.json | 333 | download job |
urls-archive.max.fan-twitter-@DSChazelle-filtered.txt-shallow-20200712-162506-cqwix-00000.warc.gz | 8713122 | download job |
urls-archive.max.fan-twitter-@DSChazelle-filtered.txt-shallow-20200712-162506-cqwix-00000.warc.os.cdx.gz | 45790 | download |
urls-archive.max.fan-twitter-@DSChazelle-filtered.txt-shallow-20200712-162506-cqwix-meta.warc.gz | 28623 | download job |
urls-archive.max.fan-twitter-@DSChazelle-filtered.txt-shallow-20200712-162506-cqwix-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@DSChazelle-filtered.txt-shallow-20200712-162506-cqwix-urls.txt | 2969 | download |
urls-archive.max.fan-twitter-@DSChazelle-filtered.txt-shallow-20200712-162506-cqwix.json | 335 | download job |
urls-archive.max.fan-twitter-@DailyDevelopmt-filtered.txt-shallow-20200712-171820-12lsj-00000.warc.gz | 52109586 | download job |
urls-archive.max.fan-twitter-@DailyDevelopmt-filtered.txt-shallow-20200712-171820-12lsj-00000.warc.os.cdx.gz | 46512 | download |
urls-archive.max.fan-twitter-@DailyDevelopmt-filtered.txt-shallow-20200712-171820-12lsj-urls.txt | 26718 | download |
urls-archive.max.fan-twitter-@DailyDevelopmt-filtered.txt-shallow-20200712-171820-12lsj.json | 343 | download job |
urls-archive.max.fan-twitter-@Danielle_4PA-filtered.txt-shallow-20200712-171337-8it80-urls.txt | 66685 | download |
urls-archive.max.fan-twitter-@DannyFaure-filtered.txt-shallow-20200712-171335-asbot.json | 335 | download job |
urls-archive.max.fan-twitter-@Data4SDGs-filtered.txt-shallow-20200712-170916-9i0bh-00000.warc.gz | 365079525 | download job |
urls-archive.max.fan-twitter-@Data4SDGs-filtered.txt-shallow-20200712-170916-9i0bh-00000.warc.os.cdx.gz | 592008 | download |
urls-archive.max.fan-twitter-@Data4SDGs-filtered.txt-shallow-20200712-170916-9i0bh-meta.warc.gz | 318624 | download job |
urls-archive.max.fan-twitter-@Data4SDGs-filtered.txt-shallow-20200712-170916-9i0bh-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Data4SDGs-filtered.txt-shallow-20200712-170916-9i0bh-urls.txt | 147624 | download |
urls-archive.max.fan-twitter-@DavidFurstNYT-filtered.txt-shallow-20200712-170515-8se45-urls.txt | 40320 | download |
urls-archive.max.fan-twitter-@DavidPorter_AP-filtered.txt-shallow-20200712-170509-9dosg-urls.txt | 51223 | download |
urls-archive.max.fan-twitter-@DavidPorter_AP-filtered.txt-shallow-20200712-170509-9dosg.json | 343 | download job |
urls-archive.max.fan-twitter-@DayemiFdn-filtered.txt-shallow-20200712-170355-2n6k6-urls.txt | 10081 | download |
urls-archive.max.fan-twitter-@DeWineHustedOH-filtered.txt-shallow-20200712-165403-2jp00-urls.txt | 50578 | download |
urls-archive.max.fan-twitter-@DeWineHustedOH-filtered.txt-shallow-20200712-165403-2jp00.json | 343 | download job |
urls-archive.max.fan-twitter-@DelaCruzMusalem-filtered.txt-shallow-20200712-165839-bceef-00000.warc.gz | 74342803 | download job |
urls-archive.max.fan-twitter-@DelaCruzMusalem-filtered.txt-shallow-20200712-165839-bceef-00000.warc.os.cdx.gz | 115801 | download |
urls-archive.max.fan-twitter-@DelaCruzMusalem-filtered.txt-shallow-20200712-165839-bceef-meta.warc.gz | 65371 | download job |
urls-archive.max.fan-twitter-@DelaCruzMusalem-filtered.txt-shallow-20200712-165839-bceef-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@DiLebouthillier-filtered.txt-shallow-20200712-164411-aro57-00000.warc.gz | 550181223 | download job |
urls-archive.max.fan-twitter-@DiLebouthillier-filtered.txt-shallow-20200712-164411-aro57-00000.warc.os.cdx.gz | 556166 | download |
urls-archive.max.fan-twitter-@DiazCanelB-filtered.txt-shallow-20200712-165110-cebwu-urls.txt | 17632 | download |
urls-archive.max.fan-twitter-@DienMagno-filtered.txt-shallow-20200712-164936-1yxuo-00000.warc.gz | 16242862 | download job |
urls-archive.max.fan-twitter-@DienMagno-filtered.txt-shallow-20200712-164936-1yxuo-00000.warc.os.cdx.gz | 22280 | download |
urls-archive.max.fan-twitter-@DienMagno-filtered.txt-shallow-20200712-164936-1yxuo-meta.warc.gz | 16503 | download job |
urls-archive.max.fan-twitter-@DienMagno-filtered.txt-shallow-20200712-164936-1yxuo-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@DienMagno-filtered.txt-shallow-20200712-164936-1yxuo-urls.txt | 12602 | download |
urls-archive.max.fan-twitter-@DienMagno-filtered.txt-shallow-20200712-164936-1yxuo.json | 333 | download job |
urls-archive.max.fan-twitter-@DieschbourgC-filtered.txt-shallow-20200712-164935-5nff8-00000.warc.gz | 31315446 | download job |
urls-archive.max.fan-twitter-@DieschbourgC-filtered.txt-shallow-20200712-164935-5nff8-00000.warc.os.cdx.gz | 71124 | download |
urls-archive.max.fan-twitter-@DieschbourgC-filtered.txt-shallow-20200712-164935-5nff8-meta.warc.gz | 42497 | download job |
urls-archive.max.fan-twitter-@DieschbourgC-filtered.txt-shallow-20200712-164935-5nff8-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@DieschbourgC-filtered.txt-shallow-20200712-164935-5nff8-urls.txt | 13253 | download |
urls-archive.max.fan-twitter-@DieschbourgC-filtered.txt-shallow-20200712-164935-5nff8.json | 339 | download job |
urls-archive.max.fan-twitter-@DigiDiplomats-filtered.txt-shallow-20200712-164933-b0c2r-urls.txt | 134293 | download |
urls-archive.max.fan-twitter-@DigitalDionne-filtered.txt-shallow-20200712-164411-3xnmj-00000.warc.gz | 178759854 | download job |
urls-archive.max.fan-twitter-@DigitalDionne-filtered.txt-shallow-20200712-164411-3xnmj-00000.warc.os.cdx.gz | 186230 | download |
urls-archive.max.fan-twitter-@DigitalDionne-filtered.txt-shallow-20200712-164411-3xnmj-meta.warc.gz | 102345 | download job |
urls-archive.max.fan-twitter-@DigitalDionne-filtered.txt-shallow-20200712-164411-3xnmj-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@DigitalDionne-filtered.txt-shallow-20200712-164411-3xnmj-urls.txt | 175209 | download |
urls-archive.max.fan-twitter-@DigitalDionne-filtered.txt-shallow-20200712-164411-3xnmj.json | 341 | download job |
urls-archive.max.fan-twitter-@DisRightsTx-filtered.txt-shallow-20200712-162939-635vz-00000.warc.gz | 192931089 | download job |
urls-archive.max.fan-twitter-@DisRightsTx-filtered.txt-shallow-20200712-162939-635vz-00000.warc.os.cdx.gz | 236042 | download |
urls-archive.max.fan-twitter-@DisRightsTx-filtered.txt-shallow-20200712-162939-635vz-meta.warc.gz | 129346 | download job |
urls-archive.max.fan-twitter-@DisRightsTx-filtered.txt-shallow-20200712-162939-635vz-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@DisRightsTx-filtered.txt-shallow-20200712-162939-635vz-urls.txt | 114566 | download |
urls-archive.max.fan-twitter-@DisRightsTx-filtered.txt-shallow-20200712-162939-635vz.json | 337 | download job |
urls-archive.max.fan-twitter-@DonYoungAK-filtered.txt-shallow-20200712-162925-838yt-00000.warc.gz | 78514068 | download job |
urls-archive.max.fan-twitter-@DonYoungAK-filtered.txt-shallow-20200712-162925-838yt-00000.warc.os.cdx.gz | 70377 | download |
urls-archive.max.fan-twitter-@DonYoungAK-filtered.txt-shallow-20200712-162925-838yt-meta.warc.gz | 41938 | download job |
urls-archive.max.fan-twitter-@DonYoungAK-filtered.txt-shallow-20200712-162925-838yt-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@DonYoungAK-filtered.txt-shallow-20200712-162925-838yt-urls.txt | 27762 | download |
urls-archive.max.fan-twitter-@DonYoungAK-filtered.txt-shallow-20200712-162925-838yt.json | 335 | download job |
urls-archive.max.fan-twitter-@DougForDakota-filtered.txt-shallow-20200712-162922-7efio-00000.warc.gz | 109145695 | download job |
urls-archive.max.fan-twitter-@DougForDakota-filtered.txt-shallow-20200712-162922-7efio-00000.warc.os.cdx.gz | 125533 | download |
urls-archive.max.fan-twitter-@DougForDakota-filtered.txt-shallow-20200712-162922-7efio-meta.warc.gz | 71815 | download job |
urls-archive.max.fan-twitter-@DougForDakota-filtered.txt-shallow-20200712-162922-7efio-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@DougForDakota-filtered.txt-shallow-20200712-162922-7efio-urls.txt | 32990 | download |
urls-archive.max.fan-twitter-@DougForDakota-filtered.txt-shallow-20200712-162922-7efio.json | 341 | download job |
urls-archive.max.fan-twitter-@DrMikeRyan-filtered.txt-shallow-20200712-162634-3su2z-00000.warc.gz | 16950199 | download job |
urls-archive.max.fan-twitter-@DrMikeRyan-filtered.txt-shallow-20200712-162634-3su2z-00000.warc.os.cdx.gz | 40658 | download |
urls-archive.max.fan-twitter-@DrMikeRyan-filtered.txt-shallow-20200712-162634-3su2z-meta.warc.gz | 26013 | download job |
urls-archive.max.fan-twitter-@DrMikeRyan-filtered.txt-shallow-20200712-162634-3su2z-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@DrMikeRyan-filtered.txt-shallow-20200712-162634-3su2z-urls.txt | 5278 | download |
urls-archive.max.fan-twitter-@DrMikeRyan-filtered.txt-shallow-20200712-162634-3su2z.json | 335 | download job |
urls-archive.max.fan-twitter-@DrMukhisaKituyi-filtered.txt-shallow-20200712-162600-e9swb-00000.warc.gz | 299595820 | download job |
urls-archive.max.fan-twitter-@DrMukhisaKituyi-filtered.txt-shallow-20200712-162600-e9swb-00000.warc.os.cdx.gz | 615255 | download |
urls-archive.max.fan-twitter-@DrMukhisaKituyi-filtered.txt-shallow-20200712-162600-e9swb-meta.warc.gz | 329132 | download job |
urls-archive.max.fan-twitter-@DrMukhisaKituyi-filtered.txt-shallow-20200712-162600-e9swb-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@DrMukhisaKituyi-filtered.txt-shallow-20200712-162600-e9swb-urls.txt | 91511 | download |
urls-archive.max.fan-twitter-@DrMukhisaKituyi-filtered.txt-shallow-20200712-162600-e9swb.json | 345 | download job |
urls-archive.max.fan-twitter-@DrNancyM_CDC-filtered.txt-shallow-20200712-162548-7oi1n-00000.warc.gz | 343310332 | download job |
urls-archive.max.fan-twitter-@DrNancyM_CDC-filtered.txt-shallow-20200712-162548-7oi1n-00000.warc.os.cdx.gz | 525966 | download |
urls-archive.max.fan-twitter-@DrNancyM_CDC-filtered.txt-shallow-20200712-162548-7oi1n-meta.warc.gz | 285087 | download job |
urls-archive.max.fan-twitter-@DrNancyM_CDC-filtered.txt-shallow-20200712-162548-7oi1n-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@DrNancyM_CDC-filtered.txt-shallow-20200712-162548-7oi1n-urls.txt | 182618 | download |
urls-archive.max.fan-twitter-@DrNancyM_CDC-filtered.txt-shallow-20200712-162548-7oi1n.json | 339 | download job |
urls-archive.max.fan-twitter-@DrNealDunnFL2-filtered.txt-shallow-20200712-162510-770x6-00000.warc.gz | 239698365 | download job |
urls-archive.max.fan-twitter-@DrNealDunnFL2-filtered.txt-shallow-20200712-162510-770x6-00000.warc.os.cdx.gz | 329489 | download |
urls-archive.max.fan-twitter-@DrNealDunnFL2-filtered.txt-shallow-20200712-162510-770x6-meta.warc.gz | 178893 | download job |
urls-archive.max.fan-twitter-@DrNealDunnFL2-filtered.txt-shallow-20200712-162510-770x6-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@DrNealDunnFL2-filtered.txt-shallow-20200712-162510-770x6-urls.txt | 76940 | download |
urls-archive.max.fan-twitter-@DrNealDunnFL2-filtered.txt-shallow-20200712-162510-770x6.json | 341 | download job |
urls-archive.max.fan-twitter-@DrTomFrieden-filtered.txt-shallow-20200712-162510-dkw9z-00000.warc.gz | 357168328 | download job |
urls-archive.max.fan-twitter-@DrTomFrieden-filtered.txt-shallow-20200712-162510-dkw9z-00000.warc.os.cdx.gz | 1120883 | download |
urls-archive.max.fan-twitter-@DrTomFrieden-filtered.txt-shallow-20200712-162510-dkw9z-meta.warc.gz | 591525 | download job |
urls-archive.max.fan-twitter-@DrTomFrieden-filtered.txt-shallow-20200712-162510-dkw9z-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@DrTomFrieden-filtered.txt-shallow-20200712-162510-dkw9z-urls.txt | 157605 | download |
urls-archive.max.fan-twitter-@DrTomFrieden-filtered.txt-shallow-20200712-162510-dkw9z.json | 339 | download job |
urls-archive.max.fan-twitter-@EMortimer-filtered.txt-shallow-20200712-154430-a3xrv-00000.warc.gz | 13674411 | download job |
urls-archive.max.fan-twitter-@EMortimer-filtered.txt-shallow-20200712-154430-a3xrv-00000.warc.os.cdx.gz | 61480 | download |
urls-archive.max.fan-twitter-@EMortimer-filtered.txt-shallow-20200712-154430-a3xrv-meta.warc.gz | 37533 | download job |
urls-archive.max.fan-twitter-@EMortimer-filtered.txt-shallow-20200712-154430-a3xrv-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EMortimer-filtered.txt-shallow-20200712-154430-a3xrv-urls.txt | 6870 | download |
urls-archive.max.fan-twitter-@EMortimer-filtered.txt-shallow-20200712-154430-a3xrv.json | 333 | download job |
urls-archive.max.fan-twitter-@EPAAWheeler-filtered.txt-shallow-20200712-154234-6qwpb-00000.warc.gz | 103429374 | download job |
urls-archive.max.fan-twitter-@EPAAWheeler-filtered.txt-shallow-20200712-154234-6qwpb-00000.warc.os.cdx.gz | 237824 | download |
urls-archive.max.fan-twitter-@EPAAWheeler-filtered.txt-shallow-20200712-154234-6qwpb-meta.warc.gz | 131900 | download job |
urls-archive.max.fan-twitter-@EPAAWheeler-filtered.txt-shallow-20200712-154234-6qwpb-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EPAAWheeler-filtered.txt-shallow-20200712-154234-6qwpb-urls.txt | 20296 | download |
urls-archive.max.fan-twitter-@EPAAWheeler-filtered.txt-shallow-20200712-154234-6qwpb.json | 337 | download job |
urls-archive.max.fan-twitter-@EPhilippe_LH-filtered.txt-shallow-20200712-154231-4yvc3-00000.warc.gz | 1059084 | download job |
urls-archive.max.fan-twitter-@EPhilippe_LH-filtered.txt-shallow-20200712-154231-4yvc3-00000.warc.os.cdx.gz | 5331 | download |
urls-archive.max.fan-twitter-@EPhilippe_LH-filtered.txt-shallow-20200712-154231-4yvc3-meta.warc.gz | 6852 | download job |
urls-archive.max.fan-twitter-@EPhilippe_LH-filtered.txt-shallow-20200712-154231-4yvc3-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EPhilippe_LH-filtered.txt-shallow-20200712-154231-4yvc3-urls.txt | 59 | download |
urls-archive.max.fan-twitter-@EPhilippe_LH-filtered.txt-shallow-20200712-154231-4yvc3.json | 339 | download job |
urls-archive.max.fan-twitter-@EPinDeutschland-filtered.txt-shallow-20200712-154230-4nhbl-00000.warc.gz | 588355699 | download job |
urls-archive.max.fan-twitter-@EPinDeutschland-filtered.txt-shallow-20200712-154230-4nhbl-00000.warc.os.cdx.gz | 687860 | download |
urls-archive.max.fan-twitter-@EPinDeutschland-filtered.txt-shallow-20200712-154230-4nhbl-meta.warc.gz | 368088 | download job |
urls-archive.max.fan-twitter-@EPinDeutschland-filtered.txt-shallow-20200712-154230-4nhbl-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EPinDeutschland-filtered.txt-shallow-20200712-154230-4nhbl-urls.txt | 386018 | download |
urls-archive.max.fan-twitter-@EPinDeutschland-filtered.txt-shallow-20200712-154230-4nhbl.json | 345 | download job |
urls-archive.max.fan-twitter-@ESCochrane-filtered.txt-shallow-20200712-153550-1d969-00000.warc.gz | 476560450 | download job |
urls-archive.max.fan-twitter-@ESCochrane-filtered.txt-shallow-20200712-153550-1d969-00000.warc.os.cdx.gz | 1048703 | download |
urls-archive.max.fan-twitter-@ESCochrane-filtered.txt-shallow-20200712-153550-1d969-meta.warc.gz | 558085 | download job |
urls-archive.max.fan-twitter-@ESCochrane-filtered.txt-shallow-20200712-153550-1d969-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@ESCochrane-filtered.txt-shallow-20200712-153550-1d969-urls.txt | 271719 | download |
urls-archive.max.fan-twitter-@ESCochrane-filtered.txt-shallow-20200712-153550-1d969.json | 335 | download job |
urls-archive.max.fan-twitter-@EdgarCLungu-filtered.txt-shallow-20200712-161721-c2zum-00000.warc.gz | 5305037 | download job |
urls-archive.max.fan-twitter-@EdgarCLungu-filtered.txt-shallow-20200712-161721-c2zum-00000.warc.os.cdx.gz | 26205 | download |
urls-archive.max.fan-twitter-@EdgarCLungu-filtered.txt-shallow-20200712-161721-c2zum-meta.warc.gz | 18023 | download job |
urls-archive.max.fan-twitter-@EdgarCLungu-filtered.txt-shallow-20200712-161721-c2zum-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EdgarCLungu-filtered.txt-shallow-20200712-161721-c2zum-urls.txt | 885 | download |
urls-archive.max.fan-twitter-@EdgarCLungu-filtered.txt-shallow-20200712-161721-c2zum.json | 337 | download job |
urls-archive.max.fan-twitter-@EdithLedererAP-filtered.txt-shallow-20200712-161654-c692h-00000.warc.gz | 3728616 | download job |
urls-archive.max.fan-twitter-@EdithLedererAP-filtered.txt-shallow-20200712-161654-c692h-00000.warc.os.cdx.gz | 8598 | download |
urls-archive.max.fan-twitter-@EdithLedererAP-filtered.txt-shallow-20200712-161654-c692h-meta.warc.gz | 8796 | download job |
urls-archive.max.fan-twitter-@EdithLedererAP-filtered.txt-shallow-20200712-161654-c692h-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EdithLedererAP-filtered.txt-shallow-20200712-161654-c692h-urls.txt | 2751 | download |
urls-archive.max.fan-twitter-@EdithLedererAP-filtered.txt-shallow-20200712-161654-c692h.json | 343 | download job |
urls-archive.max.fan-twitter-@EduCannotWait-filtered.txt-shallow-20200712-161652-1jit0-00000.warc.gz | 645929239 | download job |
urls-archive.max.fan-twitter-@EduCannotWait-filtered.txt-shallow-20200712-161652-1jit0-00000.warc.os.cdx.gz | 896882 | download |
urls-archive.max.fan-twitter-@EduCannotWait-filtered.txt-shallow-20200712-161652-1jit0-meta.warc.gz | 477939 | download job |
urls-archive.max.fan-twitter-@EduCannotWait-filtered.txt-shallow-20200712-161652-1jit0-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EduCannotWait-filtered.txt-shallow-20200712-161652-1jit0-urls.txt | 192712 | download |
urls-archive.max.fan-twitter-@EduCannotWait-filtered.txt-shallow-20200712-161652-1jit0.json | 341 | download job |
urls-archive.max.fan-twitter-@ElPasoTXGov-filtered.txt-shallow-20200712-160405-6lg2g-00000.warc.gz | 1146558402 | download job |
urls-archive.max.fan-twitter-@ElPasoTXGov-filtered.txt-shallow-20200712-160405-6lg2g-00000.warc.os.cdx.gz | 1098178 | download |
urls-archive.max.fan-twitter-@ElPasoTXGov-filtered.txt-shallow-20200712-160405-6lg2g-meta.warc.gz | 574468 | download job |
urls-archive.max.fan-twitter-@ElPasoTXGov-filtered.txt-shallow-20200712-160405-6lg2g-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@ElPasoTXGov-filtered.txt-shallow-20200712-160405-6lg2g-urls.txt | 341941 | download |
urls-archive.max.fan-twitter-@ElPasoTXGov-filtered.txt-shallow-20200712-160405-6lg2g.json | 337 | download job |
urls-archive.max.fan-twitter-@EleniForCA-filtered.txt-shallow-20200712-161650-3ejzz-00000.warc.gz | 7931414 | download job |
urls-archive.max.fan-twitter-@EleniForCA-filtered.txt-shallow-20200712-161650-3ejzz-00000.warc.os.cdx.gz | 21815 | download |
urls-archive.max.fan-twitter-@EleniForCA-filtered.txt-shallow-20200712-161650-3ejzz-meta.warc.gz | 15879 | download job |
urls-archive.max.fan-twitter-@EleniForCA-filtered.txt-shallow-20200712-161650-3ejzz-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EleniForCA-filtered.txt-shallow-20200712-161650-3ejzz-urls.txt | 2146 | download |
urls-archive.max.fan-twitter-@EleniForCA-filtered.txt-shallow-20200712-161650-3ejzz.json | 335 | download job |
urls-archive.max.fan-twitter-@EliasonMike-filtered.txt-shallow-20200712-161023-6peqd-00000.warc.gz | 370418145 | download job |
urls-archive.max.fan-twitter-@EliasonMike-filtered.txt-shallow-20200712-161023-6peqd-00000.warc.os.cdx.gz | 484430 | download |
urls-archive.max.fan-twitter-@EliasonMike-filtered.txt-shallow-20200712-161023-6peqd-meta.warc.gz | 262360 | download job |
urls-archive.max.fan-twitter-@EliasonMike-filtered.txt-shallow-20200712-161023-6peqd-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EliasonMike-filtered.txt-shallow-20200712-161023-6peqd-urls.txt | 75434 | download |
urls-archive.max.fan-twitter-@EliasonMike-filtered.txt-shallow-20200712-161023-6peqd.json | 337 | download job |
urls-archive.max.fan-twitter-@Elisabeth_Borne-filtered.txt-shallow-20200712-161016-8dcak-00000.warc.gz | 543212193 | download job |
urls-archive.max.fan-twitter-@Elisabeth_Borne-filtered.txt-shallow-20200712-161016-8dcak-00000.warc.os.cdx.gz | 949216 | download |
urls-archive.max.fan-twitter-@Elisabeth_Borne-filtered.txt-shallow-20200712-161016-8dcak-meta.warc.gz | 500159 | download job |
urls-archive.max.fan-twitter-@Elisabeth_Borne-filtered.txt-shallow-20200712-161016-8dcak-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Elisabeth_Borne-filtered.txt-shallow-20200712-161016-8dcak-urls.txt | 94442 | download |
urls-archive.max.fan-twitter-@Elisabeth_Borne-filtered.txt-shallow-20200712-161016-8dcak.json | 345 | download job |
urls-archive.max.fan-twitter-@EmbEspAtenas-filtered.txt-shallow-20200712-154748-4d2j1-00000.warc.gz | 86811194 | download job |
urls-archive.max.fan-twitter-@EmbEspAtenas-filtered.txt-shallow-20200712-154748-4d2j1-00000.warc.os.cdx.gz | 116269 | download |
urls-archive.max.fan-twitter-@EmbEspAtenas-filtered.txt-shallow-20200712-154748-4d2j1-meta.warc.gz | 65817 | download job |
urls-archive.max.fan-twitter-@EmbEspAtenas-filtered.txt-shallow-20200712-154748-4d2j1-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EmbEspAtenas-filtered.txt-shallow-20200712-154748-4d2j1-urls.txt | 48737 | download |
urls-archive.max.fan-twitter-@EmbEspAtenas-filtered.txt-shallow-20200712-154748-4d2j1.json | 339 | download job |
urls-archive.max.fan-twitter-@EmmaBubola-filtered.txt-shallow-20200712-154437-6cetx-00000.warc.gz | 14876568 | download job |
urls-archive.max.fan-twitter-@EmmaBubola-filtered.txt-shallow-20200712-154437-6cetx-00000.warc.os.cdx.gz | 27038 | download |
urls-archive.max.fan-twitter-@EmmaBubola-filtered.txt-shallow-20200712-154437-6cetx-meta.warc.gz | 19042 | download job |
urls-archive.max.fan-twitter-@EmmaBubola-filtered.txt-shallow-20200712-154437-6cetx-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EmmaBubola-filtered.txt-shallow-20200712-154437-6cetx-urls.txt | 10692 | download |
urls-archive.max.fan-twitter-@EmmaBubola-filtered.txt-shallow-20200712-154437-6cetx.json | 335 | download job |
urls-archive.max.fan-twitter-@Engelenburcht_-filtered.txt-shallow-20200712-154237-dkglc-00000.warc.gz | 1000577 | download job |
urls-archive.max.fan-twitter-@Engelenburcht_-filtered.txt-shallow-20200712-154237-dkglc-00000.warc.os.cdx.gz | 4173 | download |
urls-archive.max.fan-twitter-@Engelenburcht_-filtered.txt-shallow-20200712-154237-dkglc-meta.warc.gz | 6213 | download job |
urls-archive.max.fan-twitter-@Engelenburcht_-filtered.txt-shallow-20200712-154237-dkglc-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Engelenburcht_-filtered.txt-shallow-20200712-154237-dkglc-urls.txt | 61 | download |
urls-archive.max.fan-twitter-@Engelenburcht_-filtered.txt-shallow-20200712-154237-dkglc.json | 343 | download job |
urls-archive.max.fan-twitter-@Enstereo-filtered.txt-shallow-20200712-154237-4f91m-00000.warc.gz | 17422762 | download job |
urls-archive.max.fan-twitter-@Enstereo-filtered.txt-shallow-20200712-154237-4f91m-00000.warc.os.cdx.gz | 20734 | download |
urls-archive.max.fan-twitter-@Enstereo-filtered.txt-shallow-20200712-154237-4f91m-meta.warc.gz | 15564 | download job |
urls-archive.max.fan-twitter-@Enstereo-filtered.txt-shallow-20200712-154237-4f91m-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Enstereo-filtered.txt-shallow-20200712-154237-4f91m-urls.txt | 13474 | download |
urls-archive.max.fan-twitter-@Enstereo-filtered.txt-shallow-20200712-154237-4f91m.json | 331 | download job |
urls-archive.max.fan-twitter-@EricCarvin-filtered.txt-shallow-20200712-154227-b4k48-00000.warc.gz | 709864942 | download job |
urls-archive.max.fan-twitter-@EricCarvin-filtered.txt-shallow-20200712-154227-b4k48-00000.warc.os.cdx.gz | 971826 | download |
urls-archive.max.fan-twitter-@EricCarvin-filtered.txt-shallow-20200712-154227-b4k48-meta.warc.gz | 518780 | download job |
urls-archive.max.fan-twitter-@EricCarvin-filtered.txt-shallow-20200712-154227-b4k48-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EricCarvin-filtered.txt-shallow-20200712-154227-b4k48-urls.txt | 608026 | download |
urls-archive.max.fan-twitter-@EricCarvin-filtered.txt-shallow-20200712-154227-b4k48.json | 335 | download job |
urls-archive.max.fan-twitter-@EricSchertzing-filtered.txt-shallow-20200712-153624-f0khe-00000.warc.gz | 4357749 | download job |
urls-archive.max.fan-twitter-@EricSchertzing-filtered.txt-shallow-20200712-153624-f0khe-00000.warc.os.cdx.gz | 9345 | download |
urls-archive.max.fan-twitter-@EricSchertzing-filtered.txt-shallow-20200712-153624-f0khe-meta.warc.gz | 9166 | download job |
urls-archive.max.fan-twitter-@EricSchertzing-filtered.txt-shallow-20200712-153624-f0khe-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EricSchertzing-filtered.txt-shallow-20200712-153624-f0khe-urls.txt | 2867 | download |
urls-archive.max.fan-twitter-@EricSchertzing-filtered.txt-shallow-20200712-153624-f0khe.json | 343 | download job |
urls-archive.max.fan-twitter-@EsperDoD-filtered.txt-shallow-20200712-153420-eyq3d-00000.warc.gz | 452199728 | download job |
urls-archive.max.fan-twitter-@EsperDoD-filtered.txt-shallow-20200712-153420-eyq3d-00000.warc.os.cdx.gz | 852251 | download |
urls-archive.max.fan-twitter-@EsperDoD-filtered.txt-shallow-20200712-153420-eyq3d-meta.warc.gz | 447723 | download job |
urls-archive.max.fan-twitter-@EsperDoD-filtered.txt-shallow-20200712-153420-eyq3d-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EsperDoD-filtered.txt-shallow-20200712-153420-eyq3d-urls.txt | 61768 | download |
urls-archive.max.fan-twitter-@EsperDoD-filtered.txt-shallow-20200712-153420-eyq3d.json | 331 | download job |
urls-archive.max.fan-twitter-@EstherMcVey1-filtered.txt-shallow-20200712-153245-bqiiv-00000.warc.gz | 234098414 | download job |
urls-archive.max.fan-twitter-@EstherMcVey1-filtered.txt-shallow-20200712-153245-bqiiv-00000.warc.os.cdx.gz | 679469 | download |
urls-archive.max.fan-twitter-@EstherMcVey1-filtered.txt-shallow-20200712-153245-bqiiv-meta.warc.gz | 367567 | download job |
urls-archive.max.fan-twitter-@EstherMcVey1-filtered.txt-shallow-20200712-153245-bqiiv-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EstherMcVey1-filtered.txt-shallow-20200712-153245-bqiiv-urls.txt | 77161 | download |
urls-archive.max.fan-twitter-@EstherMcVey1-filtered.txt-shallow-20200712-153245-bqiiv.json | 339 | download job |
urls-archive.max.fan-twitter-@EstoniaUN-filtered.txt-shallow-20200712-153243-eb2lf-00000.warc.gz | 11500368 | download job |
urls-archive.max.fan-twitter-@EstoniaUN-filtered.txt-shallow-20200712-153243-eb2lf-00000.warc.os.cdx.gz | 20484 | download |
urls-archive.max.fan-twitter-@EstoniaUN-filtered.txt-shallow-20200712-153243-eb2lf-meta.warc.gz | 15205 | download job |
urls-archive.max.fan-twitter-@EstoniaUN-filtered.txt-shallow-20200712-153243-eb2lf-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EstoniaUN-filtered.txt-shallow-20200712-153243-eb2lf-urls.txt | 2166 | download |
urls-archive.max.fan-twitter-@EstoniaUN-filtered.txt-shallow-20200712-153243-eb2lf.json | 333 | download job |
urls-archive.max.fan-twitter-@Europarl_BG-filtered.txt-shallow-20200712-153204-9al3k-00000.warc.gz | 6032198 | download job |
urls-archive.max.fan-twitter-@Europarl_BG-filtered.txt-shallow-20200712-153204-9al3k-00000.warc.os.cdx.gz | 9720 | download |
urls-archive.max.fan-twitter-@Europarl_BG-filtered.txt-shallow-20200712-153204-9al3k-meta.warc.gz | 9326 | download job |
urls-archive.max.fan-twitter-@Europarl_BG-filtered.txt-shallow-20200712-153204-9al3k-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Europarl_BG-filtered.txt-shallow-20200712-153204-9al3k-urls.txt | 1652 | download |
urls-archive.max.fan-twitter-@Europarl_BG-filtered.txt-shallow-20200712-153204-9al3k.json | 337 | download job |
urls-archive.max.fan-twitter-@Europarl_CS-filtered.txt-shallow-20200712-153202-6fr1s-00000.warc.gz | 172947049 | download job |
urls-archive.max.fan-twitter-@Europarl_CS-filtered.txt-shallow-20200712-153202-6fr1s-00000.warc.os.cdx.gz | 195650 | download |
urls-archive.max.fan-twitter-@Europarl_CS-filtered.txt-shallow-20200712-153202-6fr1s-meta.warc.gz | 109319 | download job |
urls-archive.max.fan-twitter-@Europarl_CS-filtered.txt-shallow-20200712-153202-6fr1s-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Europarl_CS-filtered.txt-shallow-20200712-153202-6fr1s-urls.txt | 52982 | download |
urls-archive.max.fan-twitter-@Europarl_CS-filtered.txt-shallow-20200712-153202-6fr1s.json | 337 | download job |
urls-archive.max.fan-twitter-@Europarl_EN-filtered.txt-shallow-20200712-153114-2cj4o-00000.warc.gz | 265756516 | download job |
urls-archive.max.fan-twitter-@Europarl_EN-filtered.txt-shallow-20200712-153114-2cj4o-00000.warc.os.cdx.gz | 618831 | download |
urls-archive.max.fan-twitter-@Europarl_EN-filtered.txt-shallow-20200712-153114-2cj4o-meta.warc.gz | 334360 | download job |
urls-archive.max.fan-twitter-@Europarl_EN-filtered.txt-shallow-20200712-153114-2cj4o-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Europarl_EN-filtered.txt-shallow-20200712-153114-2cj4o-urls.txt | 50327 | download |
urls-archive.max.fan-twitter-@Europarl_EN-filtered.txt-shallow-20200712-153114-2cj4o.json | 337 | download job |
urls-archive.max.fan-twitter-@Europarl_HU-filtered.txt-shallow-20200712-153110-4rr1q-00000.warc.gz | 81778192 | download job |
urls-archive.max.fan-twitter-@Europarl_HU-filtered.txt-shallow-20200712-153110-4rr1q-00000.warc.os.cdx.gz | 87108 | download |
urls-archive.max.fan-twitter-@Europarl_HU-filtered.txt-shallow-20200712-153110-4rr1q-meta.warc.gz | 51147 | download job |
urls-archive.max.fan-twitter-@Europarl_HU-filtered.txt-shallow-20200712-153110-4rr1q-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Europarl_HU-filtered.txt-shallow-20200712-153110-4rr1q-urls.txt | 24072 | download |
urls-archive.max.fan-twitter-@Europarl_HU-filtered.txt-shallow-20200712-153110-4rr1q.json | 337 | download job |
urls-archive.max.fan-twitter-@Europarl_IT-filtered.txt-shallow-20200712-152740-b13rs-00000.warc.gz | 1348022818 | download job |
urls-archive.max.fan-twitter-@Europarl_IT-filtered.txt-shallow-20200712-152740-b13rs-00000.warc.os.cdx.gz | 1881337 | download |
urls-archive.max.fan-twitter-@Europarl_IT-filtered.txt-shallow-20200712-152740-b13rs-meta.warc.gz | 1000842 | download job |
urls-archive.max.fan-twitter-@Europarl_IT-filtered.txt-shallow-20200712-152740-b13rs-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Europarl_IT-filtered.txt-shallow-20200712-152740-b13rs-urls.txt | 558436 | download |
urls-archive.max.fan-twitter-@Europarl_IT-filtered.txt-shallow-20200712-152740-b13rs.json | 337 | download job |
urls-archive.max.fan-twitter-@Europarl_LT-filtered.txt-shallow-20200712-152738-5axh4-00000.warc.gz | 84105481 | download job |
urls-archive.max.fan-twitter-@Europarl_LT-filtered.txt-shallow-20200712-152738-5axh4-00000.warc.os.cdx.gz | 72788 | download |
urls-archive.max.fan-twitter-@Europarl_LT-filtered.txt-shallow-20200712-152738-5axh4-meta.warc.gz | 43313 | download job |
urls-archive.max.fan-twitter-@Europarl_LT-filtered.txt-shallow-20200712-152738-5axh4-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Europarl_LT-filtered.txt-shallow-20200712-152738-5axh4-urls.txt | 28615 | download |
urls-archive.max.fan-twitter-@Europarl_LT-filtered.txt-shallow-20200712-152738-5axh4.json | 337 | download job |
urls-archive.max.fan-twitter-@Europarl_LV-filtered.txt-shallow-20200712-152345-btyq0-00000.warc.gz | 160545222 | download job |
urls-archive.max.fan-twitter-@Europarl_LV-filtered.txt-shallow-20200712-152345-btyq0-00000.warc.os.cdx.gz | 132012 | download |
urls-archive.max.fan-twitter-@Europarl_LV-filtered.txt-shallow-20200712-152345-btyq0-meta.warc.gz | 74309 | download job |
urls-archive.max.fan-twitter-@Europarl_LV-filtered.txt-shallow-20200712-152345-btyq0-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Europarl_LV-filtered.txt-shallow-20200712-152345-btyq0-urls.txt | 49913 | download |
urls-archive.max.fan-twitter-@Europarl_LV-filtered.txt-shallow-20200712-152345-btyq0.json | 337 | download job |
urls-archive.max.fan-twitter-@Europarl_PL-filtered.txt-shallow-20200712-152345-cqp9g-00000.warc.gz | 160130420 | download job |
urls-archive.max.fan-twitter-@Europarl_PL-filtered.txt-shallow-20200712-152345-cqp9g-00000.warc.os.cdx.gz | 216248 | download |
urls-archive.max.fan-twitter-@Europarl_PL-filtered.txt-shallow-20200712-152345-cqp9g-meta.warc.gz | 119431 | download job |
urls-archive.max.fan-twitter-@Europarl_PL-filtered.txt-shallow-20200712-152345-cqp9g-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Europarl_PL-filtered.txt-shallow-20200712-152345-cqp9g-urls.txt | 49088 | download |
urls-archive.max.fan-twitter-@Europarl_PL-filtered.txt-shallow-20200712-152345-cqp9g.json | 337 | download job |
urls-archive.max.fan-twitter-@Europarl_PT-filtered.txt-shallow-20200712-152202-4hdn7-00000.warc.gz | 117170826 | download job |
urls-archive.max.fan-twitter-@Europarl_PT-filtered.txt-shallow-20200712-152202-4hdn7-00000.warc.os.cdx.gz | 140530 | download |
urls-archive.max.fan-twitter-@Europarl_PT-filtered.txt-shallow-20200712-152202-4hdn7-meta.warc.gz | 79742 | download job |
urls-archive.max.fan-twitter-@Europarl_PT-filtered.txt-shallow-20200712-152202-4hdn7-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Europarl_PT-filtered.txt-shallow-20200712-152202-4hdn7-urls.txt | 35990 | download |
urls-archive.max.fan-twitter-@Europarl_PT-filtered.txt-shallow-20200712-152202-4hdn7.json | 337 | download job |
urls-archive.max.fan-twitter-@Europarl_RO-filtered.txt-shallow-20200712-152201-4a20x-00000.warc.gz | 110968095 | download job |
urls-archive.max.fan-twitter-@Europarl_RO-filtered.txt-shallow-20200712-152201-4a20x-00000.warc.os.cdx.gz | 114847 | download |
urls-archive.max.fan-twitter-@Europarl_RO-filtered.txt-shallow-20200712-152201-4a20x-meta.warc.gz | 65907 | download job |
urls-archive.max.fan-twitter-@Europarl_RO-filtered.txt-shallow-20200712-152201-4a20x-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Europarl_RO-filtered.txt-shallow-20200712-152201-4a20x-urls.txt | 33099 | download |
urls-archive.max.fan-twitter-@Europarl_RO-filtered.txt-shallow-20200712-152201-4a20x.json | 337 | download job |
urls-archive.max.fan-twitter-@Europarl_da-filtered.txt-shallow-20200712-153158-ddxzc-00000.warc.gz | 72573677 | download job |
urls-archive.max.fan-twitter-@Europarl_da-filtered.txt-shallow-20200712-153158-ddxzc-00000.warc.os.cdx.gz | 77799 | download |
urls-archive.max.fan-twitter-@Europarl_da-filtered.txt-shallow-20200712-153158-ddxzc-meta.warc.gz | 46186 | download job |
urls-archive.max.fan-twitter-@Europarl_da-filtered.txt-shallow-20200712-153158-ddxzc-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Europarl_da-filtered.txt-shallow-20200712-153158-ddxzc-urls.txt | 22420 | download |
urls-archive.max.fan-twitter-@Europarl_da-filtered.txt-shallow-20200712-153158-ddxzc.json | 337 | download job |
urls-archive.max.fan-twitter-@Europarl_sv-filtered.txt-shallow-20200712-152055-34vtm-00000.warc.gz | 1804326919 | download job |
urls-archive.max.fan-twitter-@Europarl_sv-filtered.txt-shallow-20200712-152055-34vtm-00000.warc.os.cdx.gz | 1200800 | download |
urls-archive.max.fan-twitter-@Europarl_sv-filtered.txt-shallow-20200712-152055-34vtm-meta.warc.gz | 636623 | download job |
urls-archive.max.fan-twitter-@Europarl_sv-filtered.txt-shallow-20200712-152055-34vtm-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Europarl_sv-filtered.txt-shallow-20200712-152055-34vtm-urls.txt | 701554 | download |
urls-archive.max.fan-twitter-@Europarl_sv-filtered.txt-shallow-20200712-152055-34vtm.json | 337 | download job |
urls-archive.max.fan-twitter-@EvaKjerHansen-filtered.txt-shallow-20200712-152046-dlgr9-00000.warc.gz | 18318279 | download job |
urls-archive.max.fan-twitter-@EvaKjerHansen-filtered.txt-shallow-20200712-152046-dlgr9-00000.warc.os.cdx.gz | 26808 | download |
urls-archive.max.fan-twitter-@EvaKjerHansen-filtered.txt-shallow-20200712-152046-dlgr9-meta.warc.gz | 18944 | download job |
urls-archive.max.fan-twitter-@EvaKjerHansen-filtered.txt-shallow-20200712-152046-dlgr9-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@EvaKjerHansen-filtered.txt-shallow-20200712-152046-dlgr9-urls.txt | 5280 | download |
urls-archive.max.fan-twitter-@EvaKjerHansen-filtered.txt-shallow-20200712-152046-dlgr9.json | 341 | download job |
urls-archive.max.fan-twitter-@Evins-filtered.txt-shallow-20200712-151612-3buew-00000.warc.gz | 507671284 | download job |
urls-archive.max.fan-twitter-@Evins-filtered.txt-shallow-20200712-151612-3buew-00000.warc.os.cdx.gz | 570894 | download |
urls-archive.max.fan-twitter-@Evins-filtered.txt-shallow-20200712-151612-3buew-meta.warc.gz | 304318 | download job |
urls-archive.max.fan-twitter-@Evins-filtered.txt-shallow-20200712-151612-3buew-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Evins-filtered.txt-shallow-20200712-151612-3buew-urls.txt | 262809 | download |
urls-archive.max.fan-twitter-@Evins-filtered.txt-shallow-20200712-151612-3buew.json | 325 | download job |
urls-archive.max.fan-twitter-@FAOWFD-filtered.txt-shallow-20200712-150257-8kmuf-00000.warc.gz | 271640566 | download job |
urls-archive.max.fan-twitter-@FAOWFD-filtered.txt-shallow-20200712-150257-8kmuf-00000.warc.os.cdx.gz | 335164 | download |
urls-archive.max.fan-twitter-@FAOWFD-filtered.txt-shallow-20200712-150257-8kmuf-meta.warc.gz | 183786 | download job |
urls-archive.max.fan-twitter-@FAOWFD-filtered.txt-shallow-20200712-150257-8kmuf-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FAOWFD-filtered.txt-shallow-20200712-150257-8kmuf-urls.txt | 157039 | download |
urls-archive.max.fan-twitter-@FAOWFD-filtered.txt-shallow-20200712-150257-8kmuf.json | 327 | download job |
urls-archive.max.fan-twitter-@FAOWHOCodex-filtered.txt-shallow-20200712-150037-6h1du-00000.warc.gz | 2142284735 | download job |
urls-archive.max.fan-twitter-@FAOWHOCodex-filtered.txt-shallow-20200712-150037-6h1du-00000.warc.os.cdx.gz | 1959724 | download |
urls-archive.max.fan-twitter-@FAOWHOCodex-filtered.txt-shallow-20200712-150037-6h1du-meta.warc.gz | 1024980 | download job |
urls-archive.max.fan-twitter-@FAOWHOCodex-filtered.txt-shallow-20200712-150037-6h1du-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FAOWHOCodex-filtered.txt-shallow-20200712-150037-6h1du-urls.txt | 964492 | download |
urls-archive.max.fan-twitter-@FAOWHOCodex-filtered.txt-shallow-20200712-150037-6h1du.json | 337 | download job |
urls-archive.max.fan-twitter-@FEMAespanol-filtered.txt-shallow-20200712-145643-9bn0t-00000.warc.gz | 494671392 | download job |
urls-archive.max.fan-twitter-@FEMAespanol-filtered.txt-shallow-20200712-145643-9bn0t-00000.warc.os.cdx.gz | 617668 | download |
urls-archive.max.fan-twitter-@FEMAespanol-filtered.txt-shallow-20200712-145643-9bn0t-meta.warc.gz | 333836 | download job |
urls-archive.max.fan-twitter-@FEMAespanol-filtered.txt-shallow-20200712-145643-9bn0t-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FEMAespanol-filtered.txt-shallow-20200712-145643-9bn0t-urls.txt | 175692 | download |
urls-archive.max.fan-twitter-@FEMAespanol-filtered.txt-shallow-20200712-145643-9bn0t.json | 337 | download job |
urls-archive.max.fan-twitter-@FLSecofState-filtered.txt-shallow-20200712-143843-6en3a.json | 339 | download job |
urls-archive.max.fan-twitter-@FP_Champagne-filtered.txt-shallow-20200712-142440-8ieb7-00000.warc.gz | 1835262110 | download job |
urls-archive.max.fan-twitter-@FP_Champagne-filtered.txt-shallow-20200712-142440-8ieb7-00000.warc.os.cdx.gz | 2035889 | download |
urls-archive.max.fan-twitter-@FP_Champagne-filtered.txt-shallow-20200712-142440-8ieb7-meta.warc.gz | 1078811 | download job |
urls-archive.max.fan-twitter-@FP_Champagne-filtered.txt-shallow-20200712-142440-8ieb7-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FP_Champagne-filtered.txt-shallow-20200712-142440-8ieb7-urls.txt | 505594 | download |
urls-archive.max.fan-twitter-@FP_Champagne-filtered.txt-shallow-20200712-142440-8ieb7.json | 339 | download job |
urls-archive.max.fan-twitter-@FabianLeedsNE-filtered.txt-shallow-20200712-150735-dlnvi-00000.warc.gz | 36410512 | download job |
urls-archive.max.fan-twitter-@FabianLeedsNE-filtered.txt-shallow-20200712-150735-dlnvi-00000.warc.os.cdx.gz | 87344 | download |
urls-archive.max.fan-twitter-@FabianLeedsNE-filtered.txt-shallow-20200712-150735-dlnvi-meta.warc.gz | 51373 | download job |
urls-archive.max.fan-twitter-@FabianLeedsNE-filtered.txt-shallow-20200712-150735-dlnvi-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FabianLeedsNE-filtered.txt-shallow-20200712-150735-dlnvi-urls.txt | 12993 | download |
urls-archive.max.fan-twitter-@FabianLeedsNE-filtered.txt-shallow-20200712-150735-dlnvi.json | 341 | download job |
urls-archive.max.fan-twitter-@FactTank-filtered.txt-shallow-20200712-150323-eprv1-urls.txt | 1251755 | download |
urls-archive.max.fan-twitter-@FeroRuzicka-filtered.txt-shallow-20200712-145621-4l2zd-00000.warc.gz | 478517940 | download job |
urls-archive.max.fan-twitter-@FeroRuzicka-filtered.txt-shallow-20200712-145621-4l2zd-00000.warc.os.cdx.gz | 411377 | download |
urls-archive.max.fan-twitter-@FeroRuzicka-filtered.txt-shallow-20200712-145621-4l2zd-meta.warc.gz | 218581 | download job |
urls-archive.max.fan-twitter-@FeroRuzicka-filtered.txt-shallow-20200712-145621-4l2zd-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FeroRuzicka-filtered.txt-shallow-20200712-145621-4l2zd-urls.txt | 130089 | download |
urls-archive.max.fan-twitter-@FeroRuzicka-filtered.txt-shallow-20200712-145621-4l2zd.json | 337 | download job |
urls-archive.max.fan-twitter-@FilippoGrandi-filtered.txt-shallow-20200712-145207-8l06x-00000.warc.gz | 441339729 | download job |
urls-archive.max.fan-twitter-@FilippoGrandi-filtered.txt-shallow-20200712-145207-8l06x-00000.warc.os.cdx.gz | 1057630 | download |
urls-archive.max.fan-twitter-@FilippoGrandi-filtered.txt-shallow-20200712-145207-8l06x-meta.warc.gz | 564665 | download job |
urls-archive.max.fan-twitter-@FilippoGrandi-filtered.txt-shallow-20200712-145207-8l06x-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FilippoGrandi-filtered.txt-shallow-20200712-145207-8l06x-urls.txt | 97802 | download |
urls-archive.max.fan-twitter-@FilippoGrandi-filtered.txt-shallow-20200712-145207-8l06x.json | 341 | download job |
urls-archive.max.fan-twitter-@FilomenaTassi-filtered.txt-shallow-20200712-144900-9upcx-00000.warc.gz | 1077375209 | download job |
urls-archive.max.fan-twitter-@FilomenaTassi-filtered.txt-shallow-20200712-144900-9upcx-00000.warc.os.cdx.gz | 955701 | download |
urls-archive.max.fan-twitter-@FilomenaTassi-filtered.txt-shallow-20200712-144900-9upcx-meta.warc.gz | 516863 | download job |
urls-archive.max.fan-twitter-@FilomenaTassi-filtered.txt-shallow-20200712-144900-9upcx-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FilomenaTassi-filtered.txt-shallow-20200712-144900-9upcx-urls.txt | 267405 | download |
urls-archive.max.fan-twitter-@FilomenaTassi-filtered.txt-shallow-20200712-144900-9upcx.json | 341 | download job |
urls-archive.max.fan-twitter-@FireAviationNPS-filtered.txt-shallow-20200712-144833-5p0lb-00000.warc.gz | 426233747 | download job |
urls-archive.max.fan-twitter-@FireAviationNPS-filtered.txt-shallow-20200712-144833-5p0lb-00000.warc.os.cdx.gz | 466976 | download |
urls-archive.max.fan-twitter-@FireAviationNPS-filtered.txt-shallow-20200712-144833-5p0lb-meta.warc.gz | 251899 | download job |
urls-archive.max.fan-twitter-@FireAviationNPS-filtered.txt-shallow-20200712-144833-5p0lb-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FireAviationNPS-filtered.txt-shallow-20200712-144833-5p0lb-urls.txt | 160885 | download |
urls-archive.max.fan-twitter-@FireAviationNPS-filtered.txt-shallow-20200712-144833-5p0lb.json | 345 | download job |
urls-archive.max.fan-twitter-@FlesselLaura-filtered.txt-shallow-20200712-144832-bjlck-00000.warc.gz | 825463737 | download job |
urls-archive.max.fan-twitter-@FlesselLaura-filtered.txt-shallow-20200712-144832-bjlck-00000.warc.os.cdx.gz | 1282186 | download |
urls-archive.max.fan-twitter-@FlesselLaura-filtered.txt-shallow-20200712-144832-bjlck-meta.warc.gz | 681267 | download job |
urls-archive.max.fan-twitter-@FlesselLaura-filtered.txt-shallow-20200712-144832-bjlck-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FlesselLaura-filtered.txt-shallow-20200712-144832-bjlck-urls.txt | 271596 | download |
urls-archive.max.fan-twitter-@FlesselLaura-filtered.txt-shallow-20200712-144832-bjlck.json | 339 | download job |
urls-archive.max.fan-twitter-@FloIriondo-filtered.txt-shallow-20200712-144830-3t02s-00000.warc.gz | 222027529 | download job |
urls-archive.max.fan-twitter-@FloIriondo-filtered.txt-shallow-20200712-144830-3t02s-00000.warc.os.cdx.gz | 236775 | download |
urls-archive.max.fan-twitter-@FloIriondo-filtered.txt-shallow-20200712-144830-3t02s-meta.warc.gz | 129943 | download job |
urls-archive.max.fan-twitter-@FloIriondo-filtered.txt-shallow-20200712-144830-3t02s-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FloIriondo-filtered.txt-shallow-20200712-144830-3t02s-urls.txt | 151437 | download |
urls-archive.max.fan-twitter-@FloIriondo-filtered.txt-shallow-20200712-144830-3t02s.json | 335 | download job |
urls-archive.max.fan-twitter-@FluNearYou-filtered.txt-shallow-20200712-143319-64zpr-meta.warc.gz | 86698 | download job |
urls-archive.max.fan-twitter-@FluNearYou-filtered.txt-shallow-20200712-143319-64zpr-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FonsecaAP-filtered.txt-shallow-20200712-142619-8evkl-urls.txt | 49945 | download |
urls-archive.max.fan-twitter-@ForIdahoRefugee-filtered.txt-shallow-20200712-142529-70icl.json | 345 | download job |
urls-archive.max.fan-twitter-@FrancesRobles-filtered.txt-shallow-20200712-142040-1kqtg-00000.warc.gz | 957632426 | download job |
urls-archive.max.fan-twitter-@FrancesRobles-filtered.txt-shallow-20200712-142040-1kqtg-00000.warc.os.cdx.gz | 2109988 | download |
urls-archive.max.fan-twitter-@FrancesRobles-filtered.txt-shallow-20200712-142040-1kqtg-meta.warc.gz | 1114538 | download job |
urls-archive.max.fan-twitter-@FrancesRobles-filtered.txt-shallow-20200712-142040-1kqtg-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FrancesRobles-filtered.txt-shallow-20200712-142040-1kqtg-urls.txt | 756805 | download |
urls-archive.max.fan-twitter-@FrancesRobles-filtered.txt-shallow-20200712-142040-1kqtg.json | 341 | download job |
urls-archive.max.fan-twitter-@FredMonyak-filtered.txt-shallow-20200712-141624-ddstr-00000.warc.gz | 72506416 | download job |
urls-archive.max.fan-twitter-@FredMonyak-filtered.txt-shallow-20200712-141624-ddstr-00000.warc.os.cdx.gz | 191134 | download |
urls-archive.max.fan-twitter-@FreedomHKG-filtered.txt-shallow-20200712-141621-ezb7u-00000.warc.gz | 712218141 | download job |
urls-archive.max.fan-twitter-@FreedomHKG-filtered.txt-shallow-20200712-141621-ezb7u-00000.warc.os.cdx.gz | 1035354 | download |
urls-archive.max.fan-twitter-@FreedomHKG-filtered.txt-shallow-20200712-141621-ezb7u-meta.warc.gz | 550940 | download job |
urls-archive.max.fan-twitter-@FreedomHKG-filtered.txt-shallow-20200712-141621-ezb7u-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@FreedomHKG-filtered.txt-shallow-20200712-141621-ezb7u-urls.txt | 114956 | download |
urls-archive.max.fan-twitter-@FreedomHKG-filtered.txt-shallow-20200712-141621-ezb7u.json | 335 | download job |
urls-archive.max.fan-twitter-@FundacionONU-filtered.txt-shallow-20200712-141242-6cv45-meta.warc.gz | 327407 | download job |
urls-archive.max.fan-twitter-@FundacionONU-filtered.txt-shallow-20200712-141242-6cv45-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GOP-filtered.txt-shallow-20200712-132345-9x4me-00000.warc.gz | 1845889993 | download job |
urls-archive.max.fan-twitter-@GOP-filtered.txt-shallow-20200712-132345-9x4me-00000.warc.os.cdx.gz | 3292762 | download |
urls-archive.max.fan-twitter-@GOP-filtered.txt-shallow-20200712-132345-9x4me-meta.warc.gz | 1732510 | download job |
urls-archive.max.fan-twitter-@GOP-filtered.txt-shallow-20200712-132345-9x4me-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GOP-filtered.txt-shallow-20200712-132345-9x4me-urls.txt | 212313 | download |
urls-archive.max.fan-twitter-@GOP-filtered.txt-shallow-20200712-132345-9x4me.json | 321 | download job |
urls-archive.max.fan-twitter-@GaRepublicans-filtered.txt-shallow-20200712-140422-8k08n-00000.warc.gz | 559948040 | download job |
urls-archive.max.fan-twitter-@GaRepublicans-filtered.txt-shallow-20200712-140422-8k08n-00000.warc.os.cdx.gz | 877646 | download |
urls-archive.max.fan-twitter-@GaRepublicans-filtered.txt-shallow-20200712-140422-8k08n-meta.warc.gz | 470357 | download job |
urls-archive.max.fan-twitter-@GaRepublicans-filtered.txt-shallow-20200712-140422-8k08n-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GaRepublicans-filtered.txt-shallow-20200712-140422-8k08n-urls.txt | 377768 | download |
urls-archive.max.fan-twitter-@GaRepublicans-filtered.txt-shallow-20200712-140422-8k08n.json | 341 | download job |
urls-archive.max.fan-twitter-@GenevaImpact-filtered.txt-shallow-20200712-135509-2x2di-00000.warc.gz | 1022524135 | download job |
urls-archive.max.fan-twitter-@GenevaImpact-filtered.txt-shallow-20200712-135509-2x2di-00000.warc.os.cdx.gz | 1101867 | download |
urls-archive.max.fan-twitter-@GenevaImpact-filtered.txt-shallow-20200712-135509-2x2di-meta.warc.gz | 587244 | download job |
urls-archive.max.fan-twitter-@GenevaImpact-filtered.txt-shallow-20200712-135509-2x2di-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GenevaImpact-filtered.txt-shallow-20200712-135509-2x2di-urls.txt | 373178 | download |
urls-archive.max.fan-twitter-@GenevaImpact-filtered.txt-shallow-20200712-135509-2x2di.json | 339 | download job |
urls-archive.max.fan-twitter-@GermanyUN-filtered.txt-shallow-20200712-135309-4k2dl-00000.warc.gz | 1329295018 | download job |
urls-archive.max.fan-twitter-@GermanyUN-filtered.txt-shallow-20200712-135309-4k2dl-00000.warc.os.cdx.gz | 1768623 | download |
urls-archive.max.fan-twitter-@GermanyUN-filtered.txt-shallow-20200712-135309-4k2dl-meta.warc.gz | 935472 | download job |
urls-archive.max.fan-twitter-@GermanyUN-filtered.txt-shallow-20200712-135309-4k2dl-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GermanyUN-filtered.txt-shallow-20200712-135309-4k2dl-urls.txt | 418723 | download |
urls-archive.max.fan-twitter-@GermanyUN-filtered.txt-shallow-20200712-135309-4k2dl.json | 333 | download job |
urls-archive.max.fan-twitter-@GlobalEduFirst-filtered.txt-shallow-20200712-133420-au5ho-00000.warc.gz | 328708348 | download job |
urls-archive.max.fan-twitter-@GlobalEduFirst-filtered.txt-shallow-20200712-133420-au5ho-00000.warc.os.cdx.gz | 677891 | download |
urls-archive.max.fan-twitter-@GouvGN-filtered.txt-shallow-20200712-132219-bbsq1-00000.warc.gz | 1352815041 | download job |
urls-archive.max.fan-twitter-@GouvGN-filtered.txt-shallow-20200712-132219-bbsq1-00000.warc.os.cdx.gz | 1619413 | download |
urls-archive.max.fan-twitter-@GouvGN-filtered.txt-shallow-20200712-132219-bbsq1-meta.warc.gz | 851479 | download job |
urls-archive.max.fan-twitter-@GouvGN-filtered.txt-shallow-20200712-132219-bbsq1-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GouvGN-filtered.txt-shallow-20200712-132219-bbsq1-urls.txt | 1140446 | download |
urls-archive.max.fan-twitter-@GouvGN-filtered.txt-shallow-20200712-132219-bbsq1.json | 327 | download job |
urls-archive.max.fan-twitter-@GovChrisSununu-filtered.txt-shallow-20200712-131219-b7exz-urls.txt | 220895 | download |
urls-archive.max.fan-twitter-@GovMattBevin-filtered.txt-shallow-20200712-124421-buhrg-00000.warc.gz | 1457738073 | download job |
urls-archive.max.fan-twitter-@GovMattBevin-filtered.txt-shallow-20200712-124421-buhrg-00000.warc.os.cdx.gz | 2328282 | download |
urls-archive.max.fan-twitter-@GovMurphy-filtered.txt-shallow-20200712-122544-19b9l-00000.warc.gz | 1409255772 | download job |
urls-archive.max.fan-twitter-@GovMurphy-filtered.txt-shallow-20200712-122544-19b9l-00000.warc.os.cdx.gz | 3327610 | download |
urls-archive.max.fan-twitter-@GovMurphy-filtered.txt-shallow-20200712-122544-19b9l-meta.warc.gz | 1771872 | download job |
urls-archive.max.fan-twitter-@GovMurphy-filtered.txt-shallow-20200712-122544-19b9l-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@GovMurphy-filtered.txt-shallow-20200712-122544-19b9l-urls.txt | 341809 | download |
urls-archive.max.fan-twitter-@GovMurphy-filtered.txt-shallow-20200712-122544-19b9l.json | 333 | download job |
urls-archive.max.fan-twitter-@GovernorBullock-filtered.txt-shallow-20200712-130345-88oi1-00000.warc.gz | 939546893 | download job |
urls-archive.max.fan-twitter-@GovernorBullock-filtered.txt-shallow-20200712-130345-88oi1-00000.warc.os.cdx.gz | 1877908 | download |
urls-archive.max.fan-twitter-@GovernorBullock-filtered.txt-shallow-20200712-130345-88oi1-urls.txt | 514443 | download |
urls-archive.max.fan-twitter-@HayesBrown-filtered.txt-shallow-20200712-120237-5xr1i-00000.warc.gz | 5368752033 | download job |
urls-archive.max.fan-twitter-@HayesBrown-filtered.txt-shallow-20200712-120237-5xr1i-00000.warc.os.cdx.gz | 4561727 | download |
urls-archive.max.fan-twitter-@Herring_NBA-filtered.txt-shallow-20200712-115000-9dhnu-00000.warc.gz | 5368760676 | download job |
urls-archive.max.fan-twitter-@Herring_NBA-filtered.txt-shallow-20200712-115000-9dhnu-00000.warc.os.cdx.gz | 4409781 | download |
urls-archive.max.fan-twitter-@Herring_NBA-filtered.txt-shallow-20200712-115000-9dhnu-00001.warc.gz | 2330954634 | download job |
urls-archive.max.fan-twitter-@Herring_NBA-filtered.txt-shallow-20200712-115000-9dhnu-00001.warc.os.cdx.gz | 6015409 | download |
urls-archive.max.fan-twitter-@daldenAP-filtered.txt-shallow-20200712-171402-bm044-00000.warc.gz | 4443996 | download job |
urls-archive.max.fan-twitter-@daldenAP-filtered.txt-shallow-20200712-171402-bm044-00000.warc.os.cdx.gz | 7014 | download |
urls-archive.max.fan-twitter-@daldenAP-filtered.txt-shallow-20200712-171402-bm044-meta.warc.gz | 7807 | download job |
urls-archive.max.fan-twitter-@daldenAP-filtered.txt-shallow-20200712-171402-bm044-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@danablanton_nyc-filtered.txt-shallow-20200712-171350-dihmz-urls.txt | 26047 | download |
urls-archive.max.fan-twitter-@dannyhakim-filtered.txt-shallow-20200712-171332-av04k-meta.warc.gz | 387036 | download job |
urls-archive.max.fan-twitter-@dannyhakim-filtered.txt-shallow-20200712-171332-av04k-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@davidzucchino-filtered.txt-shallow-20200712-170359-3oh7h-urls.txt | 27648 | download |
urls-archive.max.fan-twitter-@dclark5-filtered.txt-shallow-20200712-170352-gv72j-urls.txt | 23872 | download |
urls-archive.max.fan-twitter-@deepakm71-filtered.txt-shallow-20200712-170326-8im46-urls.txt | 24066 | download |
urls-archive.max.fan-twitter-@demosisto-filtered.txt-shallow-20200712-165836-8945h-00000.warc.gz | 671952856 | download job |
urls-archive.max.fan-twitter-@demosisto-filtered.txt-shallow-20200712-165836-8945h-00000.warc.os.cdx.gz | 963220 | download |
urls-archive.max.fan-twitter-@dhajela-filtered.txt-shallow-20200712-165356-1jsw2-00000.warc.gz | 14449335 | download job |
urls-archive.max.fan-twitter-@dhajela-filtered.txt-shallow-20200712-165356-1jsw2-00000.warc.os.cdx.gz | 27037 | download |
urls-archive.max.fan-twitter-@dhajela-filtered.txt-shallow-20200712-165356-1jsw2-meta.warc.gz | 18955 | download job |
urls-archive.max.fan-twitter-@dhajela-filtered.txt-shallow-20200712-165356-1jsw2-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@dhajela-filtered.txt-shallow-20200712-165356-1jsw2-urls.txt | 9709 | download |
urls-archive.max.fan-twitter-@dhajela-filtered.txt-shallow-20200712-165356-1jsw2.json | 329 | download job |
urls-archive.max.fan-twitter-@dhopkins1776-filtered.txt-shallow-20200712-165351-gio9w-meta.warc.gz | 119909 | download job |
urls-archive.max.fan-twitter-@dhopkins1776-filtered.txt-shallow-20200712-165351-gio9w-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@dhopkins1776-filtered.txt-shallow-20200712-165351-gio9w-urls.txt | 61757 | download |
urls-archive.max.fan-twitter-@dinacappiello-filtered.txt-shallow-20200712-164406-6scly-00000.warc.gz | 53515316 | download job |
urls-archive.max.fan-twitter-@dinacappiello-filtered.txt-shallow-20200712-164406-6scly-00000.warc.os.cdx.gz | 114374 | download |
urls-archive.max.fan-twitter-@dinacappiello-filtered.txt-shallow-20200712-164406-6scly-meta.warc.gz | 66095 | download job |
urls-archive.max.fan-twitter-@dinacappiello-filtered.txt-shallow-20200712-164406-6scly-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@dinacappiello-filtered.txt-shallow-20200712-164406-6scly-urls.txt | 46578 | download |
urls-archive.max.fan-twitter-@dinacappiello-filtered.txt-shallow-20200712-164406-6scly.json | 341 | download job |
urls-archive.max.fan-twitter-@dionnesearcey-filtered.txt-shallow-20200712-164404-by5xx-meta.warc.gz | 326794 | download job |
urls-archive.max.fan-twitter-@dionnesearcey-filtered.txt-shallow-20200712-164404-by5xx-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@dionnesearcey-filtered.txt-shallow-20200712-164404-by5xx-urls.txt | 173452 | download |
urls-archive.max.fan-twitter-@dougmillsnyt-filtered.txt-shallow-20200712-162817-29kqm-00000.warc.gz | 457856489 | download job |
urls-archive.max.fan-twitter-@dougmillsnyt-filtered.txt-shallow-20200712-162817-29kqm-00000.warc.os.cdx.gz | 1257237 | download |
urls-archive.max.fan-twitter-@dougmillsnyt-filtered.txt-shallow-20200712-162817-29kqm-meta.warc.gz | 662934 | download job |
urls-archive.max.fan-twitter-@dougmillsnyt-filtered.txt-shallow-20200712-162817-29kqm-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@dougmillsnyt-filtered.txt-shallow-20200712-162817-29kqm-urls.txt | 122074 | download |
urls-archive.max.fan-twitter-@dougmillsnyt-filtered.txt-shallow-20200712-162817-29kqm.json | 339 | download job |
urls-archive.max.fan-twitter-@drcarolinej-filtered.txt-shallow-20200712-162813-9nfm7-00000.warc.gz | 8566339 | download job |
urls-archive.max.fan-twitter-@drcarolinej-filtered.txt-shallow-20200712-162813-9nfm7-00000.warc.os.cdx.gz | 22624 | download |
urls-archive.max.fan-twitter-@drcarolinej-filtered.txt-shallow-20200712-162813-9nfm7-meta.warc.gz | 16317 | download job |
urls-archive.max.fan-twitter-@drcarolinej-filtered.txt-shallow-20200712-162813-9nfm7-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@drcarolinej-filtered.txt-shallow-20200712-162813-9nfm7-urls.txt | 2596 | download |
urls-archive.max.fan-twitter-@drcarolinej-filtered.txt-shallow-20200712-162813-9nfm7.json | 337 | download job |
urls-archive.max.fan-twitter-@dustcloud_io-filtered.txt-shallow-20200712-162503-3jys0-00000.warc.gz | 3412124 | download job |
urls-archive.max.fan-twitter-@dustcloud_io-filtered.txt-shallow-20200712-162503-3jys0-00000.warc.os.cdx.gz | 9646 | download |
urls-archive.max.fan-twitter-@dustcloud_io-filtered.txt-shallow-20200712-162503-3jys0-meta.warc.gz | 9306 | download job |
urls-archive.max.fan-twitter-@dustcloud_io-filtered.txt-shallow-20200712-162503-3jys0-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@dustcloud_io-filtered.txt-shallow-20200712-162503-3jys0-urls.txt | 2183 | download |
urls-archive.max.fan-twitter-@dustcloud_io-filtered.txt-shallow-20200712-162503-3jys0.json | 339 | download job |
urls-archive.max.fan-twitter-@dutch3stef-filtered.txt-shallow-20200712-162045-89w3n-00000.warc.gz | 11007951 | download job |
urls-archive.max.fan-twitter-@dutch3stef-filtered.txt-shallow-20200712-162045-89w3n-00000.warc.os.cdx.gz | 15059 | download |
urls-archive.max.fan-twitter-@dutch3stef-filtered.txt-shallow-20200712-162045-89w3n-meta.warc.gz | 12405 | download job |
urls-archive.max.fan-twitter-@dutch3stef-filtered.txt-shallow-20200712-162045-89w3n-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@dutch3stef-filtered.txt-shallow-20200712-162045-89w3n-urls.txt | 6729 | download |
urls-archive.max.fan-twitter-@dutch3stef-filtered.txt-shallow-20200712-162045-89w3n.json | 335 | download job |
urls-archive.max.fan-twitter-@dylanlovan-filtered.txt-shallow-20200712-162044-nu5gh-00000.warc.gz | 110943815 | download job |
urls-archive.max.fan-twitter-@dylanlovan-filtered.txt-shallow-20200712-162044-nu5gh-00000.warc.os.cdx.gz | 126897 | download |
urls-archive.max.fan-twitter-@dylanlovan-filtered.txt-shallow-20200712-162044-nu5gh-meta.warc.gz | 72114 | download job |
urls-archive.max.fan-twitter-@dylanlovan-filtered.txt-shallow-20200712-162044-nu5gh-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@dylanlovan-filtered.txt-shallow-20200712-162044-nu5gh-urls.txt | 69901 | download |
urls-archive.max.fan-twitter-@dylanlovan-filtered.txt-shallow-20200712-162044-nu5gh.json | 335 | download job |
urls-archive.max.fan-twitter-@ebola_response-filtered.txt-shallow-20200712-162042-be8ta-00000.warc.gz | 4684525 | download job |
urls-archive.max.fan-twitter-@ebola_response-filtered.txt-shallow-20200712-162042-be8ta-00000.warc.os.cdx.gz | 20686 | download |
urls-archive.max.fan-twitter-@ebola_response-filtered.txt-shallow-20200712-162042-be8ta-meta.warc.gz | 15583 | download job |
urls-archive.max.fan-twitter-@ebola_response-filtered.txt-shallow-20200712-162042-be8ta-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@ebola_response-filtered.txt-shallow-20200712-162042-be8ta-urls.txt | 2684 | download |
urls-archive.max.fan-twitter-@ebola_response-filtered.txt-shallow-20200712-162042-be8ta.json | 343 | download job |
urls-archive.max.fan-twitter-@elianayjohnson-filtered.txt-shallow-20200712-161027-3bcgy-00000.warc.gz | 1008989022 | download job |
urls-archive.max.fan-twitter-@elianayjohnson-filtered.txt-shallow-20200712-161027-3bcgy-00000.warc.os.cdx.gz | 3027029 | download |
urls-archive.max.fan-twitter-@elianayjohnson-filtered.txt-shallow-20200712-161027-3bcgy-meta.warc.gz | 1583104 | download job |
urls-archive.max.fan-twitter-@elianayjohnson-filtered.txt-shallow-20200712-161027-3bcgy-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@elianayjohnson-filtered.txt-shallow-20200712-161027-3bcgy-urls.txt | 750539 | download |
urls-archive.max.fan-twitter-@elianayjohnson-filtered.txt-shallow-20200712-161027-3bcgy.json | 343 | download job |
urls-archive.max.fan-twitter-@elizabethjdias-filtered.txt-shallow-20200712-160408-1laor-00000.warc.gz | 45965226 | download job |
urls-archive.max.fan-twitter-@elizabethjdias-filtered.txt-shallow-20200712-160408-1laor-00000.warc.os.cdx.gz | 180937 | download |
urls-archive.max.fan-twitter-@elizabethjdias-filtered.txt-shallow-20200712-160408-1laor-meta.warc.gz | 100266 | download job |
urls-archive.max.fan-twitter-@elizabethjdias-filtered.txt-shallow-20200712-160408-1laor-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@elizabethjdias-filtered.txt-shallow-20200712-160408-1laor-urls.txt | 27582 | download |
urls-archive.max.fan-twitter-@elizabethjdias-filtered.txt-shallow-20200712-160408-1laor.json | 343 | download job |
urls-archive.max.fan-twitter-@elliotspagat-filtered.txt-shallow-20200712-160407-328dh-00000.warc.gz | 23068349 | download job |
urls-archive.max.fan-twitter-@elliotspagat-filtered.txt-shallow-20200712-160407-328dh-00000.warc.os.cdx.gz | 49507 | download |
urls-archive.max.fan-twitter-@elliotspagat-filtered.txt-shallow-20200712-160407-328dh-meta.warc.gz | 30986 | download job |
urls-archive.max.fan-twitter-@elliotspagat-filtered.txt-shallow-20200712-160407-328dh-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@elliotspagat-filtered.txt-shallow-20200712-160407-328dh-urls.txt | 13211 | download |
urls-archive.max.fan-twitter-@elliotspagat-filtered.txt-shallow-20200712-160407-328dh.json | 339 | download job |
urls-archive.max.fan-twitter-@elsiechenyi-filtered.txt-shallow-20200712-154751-2is6d-00000.warc.gz | 11833378 | download job |
urls-archive.max.fan-twitter-@elsiechenyi-filtered.txt-shallow-20200712-154751-2is6d-00000.warc.os.cdx.gz | 32452 | download |
urls-archive.max.fan-twitter-@elsiechenyi-filtered.txt-shallow-20200712-154751-2is6d-meta.warc.gz | 21601 | download job |
urls-archive.max.fan-twitter-@elsiechenyi-filtered.txt-shallow-20200712-154751-2is6d-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@elsiechenyi-filtered.txt-shallow-20200712-154751-2is6d-urls.txt | 4897 | download |
urls-archive.max.fan-twitter-@elsiechenyi-filtered.txt-shallow-20200712-154751-2is6d.json | 337 | download job |
urls-archive.max.fan-twitter-@emilysteel-filtered.txt-shallow-20200712-154741-6escq-00000.warc.gz | 409285990 | download job |
urls-archive.max.fan-twitter-@emilysteel-filtered.txt-shallow-20200712-154741-6escq-00000.warc.os.cdx.gz | 1124975 | download |
urls-archive.max.fan-twitter-@emilysteel-filtered.txt-shallow-20200712-154741-6escq-meta.warc.gz | 604449 | download job |
urls-archive.max.fan-twitter-@emilysteel-filtered.txt-shallow-20200712-154741-6escq-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@emilysteel-filtered.txt-shallow-20200712-154741-6escq-urls.txt | 309004 | download |
urls-archive.max.fan-twitter-@emilysteel-filtered.txt-shallow-20200712-154741-6escq.json | 335 | download job |
urls-archive.max.fan-twitter-@emmabgo-filtered.txt-shallow-20200712-154738-dfhm2-00000.warc.gz | 160089671 | download job |
urls-archive.max.fan-twitter-@emmabgo-filtered.txt-shallow-20200712-154738-dfhm2-00000.warc.os.cdx.gz | 291616 | download |
urls-archive.max.fan-twitter-@emmabgo-filtered.txt-shallow-20200712-154738-dfhm2-meta.warc.gz | 158868 | download job |
urls-archive.max.fan-twitter-@emmabgo-filtered.txt-shallow-20200712-154738-dfhm2-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@emmabgo-filtered.txt-shallow-20200712-154738-dfhm2-urls.txt | 105531 | download |
urls-archive.max.fan-twitter-@emmabgo-filtered.txt-shallow-20200712-154738-dfhm2.json | 329 | download job |
urls-archive.max.fan-twitter-@emoctezumab-filtered.txt-shallow-20200712-154436-771pk-00000.warc.gz | 780825475 | download job |
urls-archive.max.fan-twitter-@emoctezumab-filtered.txt-shallow-20200712-154436-771pk-00000.warc.os.cdx.gz | 1371429 | download |
urls-archive.max.fan-twitter-@emoctezumab-filtered.txt-shallow-20200712-154436-771pk-meta.warc.gz | 718510 | download job |
urls-archive.max.fan-twitter-@emoctezumab-filtered.txt-shallow-20200712-154436-771pk-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@emoctezumab-filtered.txt-shallow-20200712-154436-771pk-urls.txt | 310281 | download |
urls-archive.max.fan-twitter-@emoctezumab-filtered.txt-shallow-20200712-154436-771pk.json | 337 | download job |
urls-archive.max.fan-twitter-@energyaccessPN-filtered.txt-shallow-20200712-154429-bn4jc-00000.warc.gz | 540138528 | download job |
urls-archive.max.fan-twitter-@energyaccessPN-filtered.txt-shallow-20200712-154429-bn4jc-00000.warc.os.cdx.gz | 584598 | download |
urls-archive.max.fan-twitter-@energyaccessPN-filtered.txt-shallow-20200712-154429-bn4jc-meta.warc.gz | 313634 | download job |
urls-archive.max.fan-twitter-@energyaccessPN-filtered.txt-shallow-20200712-154429-bn4jc-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@energyaccessPN-filtered.txt-shallow-20200712-154429-bn4jc-urls.txt | 388996 | download |
urls-archive.max.fan-twitter-@energyaccessPN-filtered.txt-shallow-20200712-154429-bn4jc.json | 343 | download job |
urls-archive.max.fan-twitter-@ericswalwell-filtered.txt-shallow-20200712-153623-agev9-00000.warc.gz | 114796634 | download job |
urls-archive.max.fan-twitter-@ericswalwell-filtered.txt-shallow-20200712-153623-agev9-00000.warc.os.cdx.gz | 497379 | download |
urls-archive.max.fan-twitter-@ericswalwell-filtered.txt-shallow-20200712-153623-agev9-meta.warc.gz | 266738 | download job |
urls-archive.max.fan-twitter-@ericswalwell-filtered.txt-shallow-20200712-153623-agev9-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@ericswalwell-filtered.txt-shallow-20200712-153623-agev9-urls.txt | 27540 | download |
urls-archive.max.fan-twitter-@ericswalwell-filtered.txt-shallow-20200712-153623-agev9.json | 339 | download job |
urls-archive.max.fan-twitter-@ericthayer-filtered.txt-shallow-20200712-153602-2wfjs-00000.warc.gz | 84856432 | download job |
urls-archive.max.fan-twitter-@ericthayer-filtered.txt-shallow-20200712-153602-2wfjs-00000.warc.os.cdx.gz | 100616 | download |
urls-archive.max.fan-twitter-@ericthayer-filtered.txt-shallow-20200712-153602-2wfjs-meta.warc.gz | 58094 | download job |
urls-archive.max.fan-twitter-@ericthayer-filtered.txt-shallow-20200712-153602-2wfjs-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@ericthayer-filtered.txt-shallow-20200712-153602-2wfjs-urls.txt | 77837 | download |
urls-archive.max.fan-twitter-@ericthayer-filtered.txt-shallow-20200712-153602-2wfjs.json | 335 | download job |
urls-archive.max.fan-twitter-@erinschaff-filtered.txt-shallow-20200712-153551-70vvs-00000.warc.gz | 15948690 | download job |
urls-archive.max.fan-twitter-@erinschaff-filtered.txt-shallow-20200712-153551-70vvs-00000.warc.os.cdx.gz | 40745 | download |
urls-archive.max.fan-twitter-@erinschaff-filtered.txt-shallow-20200712-153551-70vvs-meta.warc.gz | 26194 | download job |
urls-archive.max.fan-twitter-@erinschaff-filtered.txt-shallow-20200712-153551-70vvs-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@erinschaff-filtered.txt-shallow-20200712-153551-70vvs-urls.txt | 5911 | download |
urls-archive.max.fan-twitter-@erinschaff-filtered.txt-shallow-20200712-153551-70vvs.json | 335 | download job |
urls-archive.max.fan-twitter-@evoespueblo-filtered.txt-shallow-20200712-151610-457o0-meta.warc.gz | 3122851 | download job |
urls-archive.max.fan-twitter-@evoespueblo-filtered.txt-shallow-20200712-151610-457o0-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@ewarren-filtered.txt-shallow-20200712-150735-67llf-00000.warc.gz | 154995000 | download job |
urls-archive.max.fan-twitter-@ewarren-filtered.txt-shallow-20200712-150735-67llf-00000.warc.os.cdx.gz | 612431 | download |
urls-archive.max.fan-twitter-@ewarren-filtered.txt-shallow-20200712-150735-67llf-meta.warc.gz | 328687 | download job |
urls-archive.max.fan-twitter-@ewarren-filtered.txt-shallow-20200712-150735-67llf-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@ewarren-filtered.txt-shallow-20200712-150735-67llf-urls.txt | 31020 | download |
urls-archive.max.fan-twitter-@ewarren-filtered.txt-shallow-20200712-150735-67llf.json | 329 | download job |
urls-archive.max.fan-twitter-@florence_parly-filtered.txt-shallow-20200712-144806-bkp78-00000.warc.gz | 448562197 | download job |
urls-archive.max.fan-twitter-@florence_parly-filtered.txt-shallow-20200712-144806-bkp78-00000.warc.os.cdx.gz | 872314 | download |
urls-archive.max.fan-twitter-@florence_parly-filtered.txt-shallow-20200712-144806-bkp78-meta.warc.gz | 464818 | download job |
urls-archive.max.fan-twitter-@florence_parly-filtered.txt-shallow-20200712-144806-bkp78-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@florence_parly-filtered.txt-shallow-20200712-144806-bkp78-urls.txt | 120645 | download |
urls-archive.max.fan-twitter-@florence_parly-filtered.txt-shallow-20200712-144806-bkp78.json | 343 | download job |
urls-archive.max.fan-twitter-@florian_krammer-filtered.txt-shallow-20200712-143850-9t134-00000.warc.gz | 463482826 | download job |
urls-archive.max.fan-twitter-@florian_krammer-filtered.txt-shallow-20200712-143850-9t134-00000.warc.os.cdx.gz | 1074955 | download |
urls-archive.max.fan-twitter-@florian_krammer-filtered.txt-shallow-20200712-143850-9t134-meta.warc.gz | 575795 | download job |
urls-archive.max.fan-twitter-@florian_krammer-filtered.txt-shallow-20200712-143850-9t134-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@florian_krammer-filtered.txt-shallow-20200712-143850-9t134-urls.txt | 240530 | download |
urls-archive.max.fan-twitter-@florian_krammer-filtered.txt-shallow-20200712-143850-9t134.json | 345 | download job |
urls-archive.max.fan-twitter-@flynnkaNYT-filtered.txt-shallow-20200712-143319-96f0p-meta.warc.gz | 94507 | download job |
urls-archive.max.fan-twitter-@flynnkaNYT-filtered.txt-shallow-20200712-143319-96f0p-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@franceonu-filtered.txt-shallow-20200712-142041-6zmgq-00000.warc.gz | 4109972217 | download job |
urls-archive.max.fan-twitter-@franceonu-filtered.txt-shallow-20200712-142041-6zmgq-00000.warc.os.cdx.gz | 4944831 | download |
urls-archive.max.fan-twitter-@franceonu-filtered.txt-shallow-20200712-142041-6zmgq-meta.warc.gz | 2577668 | download job |
urls-archive.max.fan-twitter-@franceonu-filtered.txt-shallow-20200712-142041-6zmgq-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@franceonu-filtered.txt-shallow-20200712-142041-6zmgq-urls.txt | 1174656 | download |
urls-archive.max.fan-twitter-@franceonu-filtered.txt-shallow-20200712-142041-6zmgq.json | 333 | download job |
urls-archive.max.fan-twitter-@franniemkoba-filtered.txt-shallow-20200712-141754-204uq.json | 339 | download job |
urls-archive.max.fan-twitter-@gabriellaangojo-filtered.txt-shallow-20200712-141242-zhqht-urls.txt | 25706 | download |
urls-archive.max.fan-twitter-@gflaccus-filtered.txt-shallow-20200712-135305-3eaae-urls.txt | 112415 | download |
urls-archive.max.fan-twitter-@globalnyc-filtered.txt-shallow-20200712-132832-1ycz4-00000.warc.gz | 980547014 | download job |
urls-archive.max.fan-twitter-@globalnyc-filtered.txt-shallow-20200712-132832-1ycz4-00000.warc.os.cdx.gz | 1047226 | download |
urls-archive.max.fan-twitter-@globalnyc-filtered.txt-shallow-20200712-132832-1ycz4-meta.warc.gz | 555055 | download job |
urls-archive.max.fan-twitter-@globalnyc-filtered.txt-shallow-20200712-132832-1ycz4-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@goonj-filtered.txt-shallow-20200712-132827-9t77k-meta.warc.gz | 545392 | download job |
urls-archive.max.fan-twitter-@goonj-filtered.txt-shallow-20200712-132827-9t77k-meta.warc.os.cdx.gz | 47 | download |
urls-transfer.notkiska.pw-facebook-@DiscoverPinetop-shallow-20200712-155804-cym10-00000.warc.gz | 290556877 | download job |
urls-transfer.notkiska.pw-facebook-@DiscoverPinetop-shallow-20200712-155804-cym10-00000.warc.os.cdx.gz | 367419 | download |
urls-transfer.notkiska.pw-facebook-@DiscoverPinetop-shallow-20200712-155804-cym10-meta.warc.gz | 243792 | download job |
urls-transfer.notkiska.pw-facebook-@DiscoverPinetop-shallow-20200712-155804-cym10-meta.warc.os.cdx.gz | 47 | download |
urls-transfer.notkiska.pw-facebook-@DiscoverPinetop-shallow-20200712-155804-cym10-urls.txt | 20037 | download |
urls-transfer.notkiska.pw-facebook-@DiscoverPinetop-shallow-20200712-155804-cym10.json | 344 | download job |
urls-transfer.notkiska.pw-twitter-%23BlackHistoryMonth-shallow-20200610-132545-46qdq-00210.warc.gz | 6345412163 | download job |
urls-transfer.notkiska.pw-twitter-%23BlackHistoryMonth-shallow-20200610-132545-46qdq-00210.warc.os.cdx.gz | 13319 | download |
urls-transfer.notkiska.pw-twitter-%23BlackTwitter-shallow-20200710-163004-dpwry-00003.warc.gz | 5368726041 | download job |
urls-transfer.notkiska.pw-twitter-%23BlackTwitter-shallow-20200710-163004-dpwry-00003.warc.os.cdx.gz | 7322702 | download |
urls-transfer.notkiska.pw-twitter-%23Srebrenitsa-shallow-20200711-202724-ccuwz-00002.warc.gz | 5369910890 | download job |
urls-transfer.notkiska.pw-twitter-%23Srebrenitsa-shallow-20200711-202724-ccuwz-00002.warc.os.cdx.gz | 5202175 | download |
urls-transfer.notkiska.pw-twitter-%23notmypresident-shallow-20200530-220957-2c0z0-00129.warc.gz | 5369021071 | download job |
urls-transfer.notkiska.pw-twitter-%23notmypresident-shallow-20200530-220957-2c0z0-00129.warc.os.cdx.gz | 1755353 | download |
urls-transfer.notkiska.pw-twitter-@bonappetit-shallow-20200712-003605-9ajtk-00001.warc.gz | 5369357835 | download job |
urls-transfer.notkiska.pw-twitter-@bonappetit-shallow-20200712-003605-9ajtk-00001.warc.os.cdx.gz | 6463964 | download |
urls-transfer.notkiska.pw-vote-usa_org-twitter-accounts-outlinks.1.txt-shallow-20200609-230435-7k4tj-00082.warc.gz | 5376749890 | download job |
urls-transfer.notkiska.pw-vote-usa_org-twitter-accounts-outlinks.1.txt-shallow-20200609-230435-7k4tj-00082.warc.os.cdx.gz | 477745 | download |
urls-transfer.notkiska.pw-www.cfr.org_rerun_403s.txt-shallow-20200712-171252-9migq-aborted-00000.warc.gz | 4324758 | download job |
urls-transfer.notkiska.pw-www.cfr.org_rerun_403s.txt-shallow-20200712-171252-9migq-aborted-00000.warc.os.cdx.gz | 96885 | download |
urls-transfer.notkiska.pw-www.cfr.org_rerun_403s.txt-shallow-20200712-171252-9migq-aborted.json | 344 | download job |
urls-transfer.notkiska.pw-www.cfr403s.txt-shallow-20200712-161440-2cotg-aborted-00000.warc.gz | 6073470 | download job |
urls-transfer.notkiska.pw-www.cfr403s.txt-shallow-20200712-161440-2cotg-aborted-00000.warc.os.cdx.gz | 166147 | download |
urls-transfer.notkiska.pw-www.cfr403s.txt-shallow-20200712-161440-2cotg-aborted-wpull.log.gz | 77050 | download |
urls-transfer.notkiska.pw-www.cfr403s.txt-shallow-20200712-161440-2cotg-aborted.json | 322 | download job |
www.bukarest.balassiintezet.hu-inf-20200707-090517-doafk-00002.warc.gz | 5369044533 | download job |
www.bukarest.balassiintezet.hu-inf-20200707-090517-doafk-00002.warc.os.cdx.gz | 4358768 | download |
www.cfr.org-shallow-20200712-175046-f2oeg-00000.warc.gz | 11875 | download job |
www.cfr.org-shallow-20200712-175046-f2oeg-00000.warc.os.cdx.gz | 274 | download |
www.cfr.org-shallow-20200712-175046-f2oeg-meta.warc.gz | 3575 | download job |
www.cfr.org-shallow-20200712-175046-f2oeg-meta.warc.os.cdx.gz | 47 | download |
www.discoverpinetop.com-inf-20200712-155843-srlkz-00000.warc.gz | 184329898 | download job |
www.discoverpinetop.com-inf-20200712-155843-srlkz-00000.warc.os.cdx.gz | 245638 | download |
www.discoverpinetop.com-inf-20200712-155843-srlkz-meta.warc.gz | 174866 | download job |
www.discoverpinetop.com-inf-20200712-155843-srlkz-meta.warc.os.cdx.gz | 47 | download |
www.discoverpinetop.com-inf-20200712-155843-srlkz.json | 253 | download job |
www.refinery29.com-inf-20191002-211042-3symg-00658.warc.gz | 5368709921 | download job |
www.refinery29.com-inf-20191002-211042-3symg-00658.warc.os.cdx.gz | 2176443 | download |
yepan.tistory.com-inf-20200711-025221-cq5rp-00006.warc.gz | 5383037473 | download job |
yepan.tistory.com-inf-20200711-025221-cq5rp-00006.warc.os.cdx.gz | 3420426 | download |
yepan.tistory.com-inf-20200711-025221-cq5rp-00007.warc.gz | 5369152938 | download job |
yepan.tistory.com-inf-20200711-025221-cq5rp-00007.warc.os.cdx.gz | 2737438 | download |