Item archiveteam_archivebot_go_20200710200001

View on Internet Archive

Filename Size
110000bjcc.12371.cn-inf-20200710-172823-4j7bz-00000.warc.gz 2482 download   job
110000bjcc.12371.cn-inf-20200710-172823-4j7bz-00000.warc.os.cdx.gz 47 download
110000bjcc.12371.cn-inf-20200710-172823-4j7bz-meta.warc.gz 3575 download   job
110000bjcc.12371.cn-inf-20200710-172823-4j7bz-meta.warc.os.cdx.gz 47 download
110000bjcc.12371.cn-inf-20200710-172823-4j7bz.json 248 download   job
140100sxdygbjy.12371.cn-inf-20200710-172904-agm2f-00000.warc.gz 2486 download   job
140100sxdygbjy.12371.cn-inf-20200710-172904-agm2f-00000.warc.os.cdx.gz 47 download
140100sxdygbjy.12371.cn-inf-20200710-172904-agm2f-meta.warc.gz 3580 download   job
140100sxdygbjy.12371.cn-inf-20200710-172904-agm2f-meta.warc.os.cdx.gz 47 download
140100sxdygbjy.12371.cn-inf-20200710-172904-agm2f.json 252 download   job
370000qlxf.12371.cn-inf-20200710-172936-3ijoz-00000.warc.gz 2483 download   job
370000qlxf.12371.cn-inf-20200710-172936-3ijoz-00000.warc.os.cdx.gz 47 download
370000qlxf.12371.cn-inf-20200710-172936-3ijoz-meta.warc.gz 3577 download   job
370000qlxf.12371.cn-inf-20200710-172936-3ijoz-meta.warc.os.cdx.gz 47 download
370000qlxf.12371.cn-inf-20200710-172936-3ijoz.json 248 download   job
420000jcqzw.12371.cn-inf-20200710-172949-7s3xh-00000.warc.gz 2483 download   job
420000jcqzw.12371.cn-inf-20200710-172949-7s3xh-00000.warc.os.cdx.gz 47 download
420000jcqzw.12371.cn-inf-20200710-172949-7s3xh-meta.warc.gz 3572 download   job
420000jcqzw.12371.cn-inf-20200710-172949-7s3xh-meta.warc.os.cdx.gz 47 download
420000jcqzw.12371.cn-inf-20200710-172949-7s3xh.json 249 download   job
440000gdycjy.12371.cn-inf-20200710-173008-28vk3-00000.warc.gz 2488 download   job
440000gdycjy.12371.cn-inf-20200710-173008-28vk3-00000.warc.os.cdx.gz 47 download
440000gdycjy.12371.cn-inf-20200710-173008-28vk3-meta.warc.gz 3589 download   job
440000gdycjy.12371.cn-inf-20200710-173008-28vk3-meta.warc.os.cdx.gz 47 download
440000gdycjy.12371.cn-inf-20200710-173008-28vk3.json 250 download   job
450000bgxf.12371.cn-inf-20200710-173022-61nx8-00000.warc.gz 2481 download   job
450000bgxf.12371.cn-inf-20200710-173022-61nx8-00000.warc.os.cdx.gz 47 download
450000bgxf.12371.cn-inf-20200710-173022-61nx8-meta.warc.gz 3503 download   job
450000bgxf.12371.cn-inf-20200710-173022-61nx8-meta.warc.os.cdx.gz 47 download
450000bgxf.12371.cn-inf-20200710-173022-61nx8.json 248 download   job
apps.12371.cn-inf-20200710-173040-2accg-00000.warc.gz 2469 download   job
apps.12371.cn-inf-20200710-173040-2accg-00000.warc.os.cdx.gz 47 download
apps.12371.cn-inf-20200710-173040-2accg-meta.warc.gz 3480 download   job
apps.12371.cn-inf-20200710-173040-2accg-meta.warc.os.cdx.gz 47 download
apps.12371.cn-inf-20200710-173040-2accg.json 242 download   job
archiveteam_archivebot_go_20200710200001.cdx.gz 134433256 download
archiveteam_archivebot_go_20200710200001.cdx.idx 112778 download
archiveteam_archivebot_go_20200710200001_files.xml 0 download
archiveteam_archivebot_go_20200710200001_meta.sqlite 982016 download
archiveteam_archivebot_go_20200710200001_meta.xml 969 download
bbs.12371.cn-inf-20200710-173051-10g0m-00000.warc.gz 2464 download   job
bbs.12371.cn-inf-20200710-173051-10g0m-00000.warc.os.cdx.gz 47 download
bbs.12371.cn-inf-20200710-173051-10g0m-meta.warc.gz 3535 download   job
bbs.12371.cn-inf-20200710-173051-10g0m-meta.warc.os.cdx.gz 47 download
bbs.12371.cn-inf-20200710-173051-10g0m.json 241 download   job
biaozhang.12371.cn-inf-20200710-173131-2oqph-00000.warc.gz 4476676 download   job
biaozhang.12371.cn-inf-20200710-173131-2oqph-00000.warc.os.cdx.gz 11699 download
biaozhang.12371.cn-inf-20200710-173131-2oqph-meta.warc.gz 10654 download   job
biaozhang.12371.cn-inf-20200710-173131-2oqph-meta.warc.os.cdx.gz 47 download
biaozhang.12371.cn-inf-20200710-173131-2oqph.json 247 download   job
blog.12371.cn-inf-20200710-173156-anw4s-00000.warc.gz 6237 download   job
blog.12371.cn-inf-20200710-173156-anw4s-00000.warc.os.cdx.gz 288 download
blog.12371.cn-inf-20200710-173156-anw4s-meta.warc.gz 3512 download   job
blog.12371.cn-inf-20200710-173156-anw4s-meta.warc.os.cdx.gz 47 download
blog.12371.cn-inf-20200710-173156-anw4s.json 242 download   job
cleaning.12371.cn-inf-20200710-173213-9h4mm-00000.warc.gz 6481 download   job
cleaning.12371.cn-inf-20200710-173213-9h4mm-00000.warc.os.cdx.gz 261 download
cleaning.12371.cn-inf-20200710-173213-9h4mm-meta.warc.gz 3535 download   job
cleaning.12371.cn-inf-20200710-173213-9h4mm-meta.warc.os.cdx.gz 47 download
cleaning.12371.cn-inf-20200710-173213-9h4mm.json 246 download   job
cliqz.com-inf-20200501-194732-82yzf-00245.warc.gz 5374446968 download   job
cliqz.com-inf-20200501-194732-82yzf-00245.warc.os.cdx.gz 3170002 download
dianxing.12371.cn-inf-20200710-173822-9qnns-00000.warc.gz 192992247 download   job
dianxing.12371.cn-inf-20200710-173822-9qnns-00000.warc.os.cdx.gz 287529 download
dianxing.12371.cn-inf-20200710-173822-9qnns-meta.warc.gz 159319 download   job
dianxing.12371.cn-inf-20200710-173822-9qnns-meta.warc.os.cdx.gz 47 download
dianxing.12371.cn-inf-20200710-173822-9qnns.json 246 download   job
dianzan.12371.cn-inf-20200710-173337-dyeh7-00000.warc.gz 5842 download   job
dianzan.12371.cn-inf-20200710-173337-dyeh7-00000.warc.os.cdx.gz 258 download
dianzan.12371.cn-inf-20200710-173337-dyeh7-meta.warc.gz 3506 download   job
dianzan.12371.cn-inf-20200710-173337-dyeh7-meta.warc.os.cdx.gz 47 download
dianzan.12371.cn-inf-20200710-173337-dyeh7.json 245 download   job
download.12371.cn-inf-20200710-173402-7360r-00000.warc.gz 6576 download   job
download.12371.cn-inf-20200710-173402-7360r-00000.warc.os.cdx.gz 289 download
download.12371.cn-inf-20200710-173402-7360r-meta.warc.gz 3536 download   job
download.12371.cn-inf-20200710-173402-7360r-meta.warc.os.cdx.gz 47 download
download.12371.cn-inf-20200710-173402-7360r.json 246 download   job
download.12371.cn-inf-20200710-173458-wb2qx-00000.warc.gz 3704667039 download   job
download.12371.cn-inf-20200710-173458-wb2qx-00000.warc.os.cdx.gz 495 download
download.12371.cn-inf-20200710-173458-wb2qx-meta.warc.gz 3698 download   job
download.12371.cn-inf-20200710-173458-wb2qx-meta.warc.os.cdx.gz 47 download
download.12371.cn-inf-20200710-173458-wb2qx.json 257 download   job
ele.xuexi.12371.cn-inf-20200710-180809-9kjm0-00000.warc.gz 2477 download   job
ele.xuexi.12371.cn-inf-20200710-180809-9kjm0-00000.warc.os.cdx.gz 47 download
ele.xuexi.12371.cn-inf-20200710-180809-9kjm0-meta.warc.gz 3576 download   job
ele.xuexi.12371.cn-inf-20200710-180809-9kjm0-meta.warc.os.cdx.gz 47 download
ele.xuexi.12371.cn-inf-20200710-180809-9kjm0.json 247 download   job
forums.bohemia.net-inf-20200603-013635-egbvu-00091.warc.gz 5418949801 download   job
forums.bohemia.net-inf-20200603-013635-egbvu-00091.warc.os.cdx.gz 6862722 download
fuwu.12371.cn-inf-20200710-175509-8rz9v-00000.warc.gz 4476094 download   job
fuwu.12371.cn-inf-20200710-175509-8rz9v-00000.warc.os.cdx.gz 11687 download
fuwu.12371.cn-inf-20200710-175509-8rz9v-meta.warc.gz 10564 download   job
fuwu.12371.cn-inf-20200710-175509-8rz9v-meta.warc.os.cdx.gz 47 download
fuwu.12371.cn-inf-20200710-175509-8rz9v.json 242 download   job
getsatisfaction.com-inf-20200708-234031-epnla-00009.warc.gz 5371892099 download   job
getsatisfaction.com-inf-20200708-234031-epnla-00009.warc.os.cdx.gz 10641910 download
jiaoliu.12371.cn-inf-20200710-175633-q6rhw-00000.warc.gz 505853694 download   job
jiaoliu.12371.cn-inf-20200710-175633-q6rhw-00000.warc.os.cdx.gz 340672 download
jiaoliu.12371.cn-inf-20200710-175633-q6rhw-meta.warc.gz 208371 download   job
jiaoliu.12371.cn-inf-20200710-175633-q6rhw-meta.warc.os.cdx.gz 47 download
jiaoliu.12371.cn-inf-20200710-175633-q6rhw.json 245 download   job
jingda.12371.cn-inf-20200710-180312-aa9yg-00000.warc.gz 1610971 download   job
jingda.12371.cn-inf-20200710-180312-aa9yg-00000.warc.os.cdx.gz 1010 download
jingda.12371.cn-inf-20200710-180312-aa9yg-meta.warc.gz 4216 download   job
jingda.12371.cn-inf-20200710-180312-aa9yg-meta.warc.os.cdx.gz 47 download
jingda.12371.cn-inf-20200710-180312-aa9yg.json 276 download   job
jingda.12371.cn-inf-20200710-180343-3t33u-00000.warc.gz 3868 download   job
jingda.12371.cn-inf-20200710-180343-3t33u-00000.warc.os.cdx.gz 228 download
jingda.12371.cn-inf-20200710-180343-3t33u-meta.warc.gz 3529 download   job
jingda.12371.cn-inf-20200710-180343-3t33u-meta.warc.os.cdx.gz 47 download
jingda.12371.cn-inf-20200710-180343-3t33u.json 270 download   job
jingda.12371.cn-inf-20200710-180523-3t33u-00000.warc.gz 3726 download   job
jingda.12371.cn-inf-20200710-180523-3t33u-00000.warc.os.cdx.gz 229 download
jingda.12371.cn-inf-20200710-180523-3t33u-meta.warc.gz 3467 download   job
jingda.12371.cn-inf-20200710-180523-3t33u-meta.warc.os.cdx.gz 47 download
jingda.12371.cn-inf-20200710-180523-3t33u.json 270 download   job
jingda.12371.cn-inf-20200710-180603-9s671-00000.warc.gz 11662926 download   job
jingda.12371.cn-inf-20200710-180603-9s671-00000.warc.os.cdx.gz 18344 download
jingda.12371.cn-inf-20200710-180603-9s671-meta.warc.gz 14345 download   job
jingda.12371.cn-inf-20200710-180603-9s671-meta.warc.os.cdx.gz 47 download
jingda.12371.cn-inf-20200710-180603-9s671.json 267 download   job
jingda.12371.cn-inf-20200710-180733-7vdir-00000.warc.gz 6254 download   job
jingda.12371.cn-inf-20200710-180733-7vdir-00000.warc.os.cdx.gz 292 download
jingda.12371.cn-inf-20200710-180733-7vdir-meta.warc.gz 3512 download   job
jingda.12371.cn-inf-20200710-180733-7vdir-meta.warc.os.cdx.gz 47 download
jingda.12371.cn-inf-20200710-180733-7vdir.json 244 download   job
jubao.12377.cn-inf-20200710-180839-c843c-00000.warc.gz 2472 download   job
jubao.12377.cn-inf-20200710-180839-c843c-00000.warc.os.cdx.gz 47 download
jubao.12377.cn-inf-20200710-180839-c843c-meta.warc.gz 3523 download   job
jubao.12377.cn-inf-20200710-180839-c843c-meta.warc.os.cdx.gz 47 download
jubao.12377.cn-inf-20200710-180839-c843c.json 243 download   job
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00067.warc.gz 5429853662 download   job
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00067.warc.os.cdx.gz 233639 download
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00068.warc.gz 5486769984 download   job
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00068.warc.os.cdx.gz 5359 download
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00069.warc.gz 5372033709 download   job
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00069.warc.os.cdx.gz 53719 download
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00070.warc.gz 5509080630 download   job
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00070.warc.os.cdx.gz 7772 download
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00071.warc.gz 5552956220 download   job
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00071.warc.os.cdx.gz 8093 download
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00073.warc.gz 5821118606 download   job
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00073.warc.os.cdx.gz 9980 download
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00074.warc.gz 6080927493 download   job
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00074.warc.os.cdx.gz 11164 download
music.yandex-shallow-20200710-175650-5s0h4-00000.warc.gz 1084033 download   job
music.yandex-shallow-20200710-175650-5s0h4-00000.warc.os.cdx.gz 5667 download
music.yandex-shallow-20200710-175650-5s0h4-meta.warc.gz 6471 download   job
music.yandex-shallow-20200710-175650-5s0h4-meta.warc.os.cdx.gz 47 download
music.yandex-shallow-20200710-175650-5s0h4.json 251 download   job
music.yandex-shallow-20200710-175653-bimi2-00000.warc.gz 1084206 download   job
music.yandex-shallow-20200710-175653-bimi2-00000.warc.os.cdx.gz 5666 download
music.yandex-shallow-20200710-175653-bimi2-meta.warc.gz 6433 download   job
music.yandex-shallow-20200710-175653-bimi2-meta.warc.os.cdx.gz 47 download
music.yandex-shallow-20200710-175653-bimi2.json 246 download   job
music.yandex.com-shallow-20200710-175639-2lldf-00000.warc.gz 1083390 download   job
music.yandex.com-shallow-20200710-175639-2lldf-00000.warc.os.cdx.gz 5637 download
music.yandex.com-shallow-20200710-175639-2lldf-meta.warc.gz 6459 download   job
music.yandex.com-shallow-20200710-175639-2lldf-meta.warc.os.cdx.gz 47 download
music.yandex.com-shallow-20200710-175639-2lldf.json 255 download   job
music.yandex.com-shallow-20200710-175643-52all-00000.warc.gz 1083579 download   job
music.yandex.com-shallow-20200710-175643-52all-00000.warc.os.cdx.gz 5642 download
music.yandex.com-shallow-20200710-175643-52all-meta.warc.gz 6478 download   job
music.yandex.com-shallow-20200710-175643-52all-meta.warc.os.cdx.gz 47 download
music.yandex.com-shallow-20200710-175643-52all.json 250 download   job
music.yandex.ru-shallow-20200710-175634-byfjs-00000.warc.gz 1083491 download   job
music.yandex.ru-shallow-20200710-175634-byfjs-00000.warc.os.cdx.gz 5659 download
music.yandex.ru-shallow-20200710-175634-byfjs-meta.warc.gz 6457 download   job
music.yandex.ru-shallow-20200710-175634-byfjs-meta.warc.os.cdx.gz 47 download
music.yandex.ru-shallow-20200710-175634-byfjs.json 254 download   job
music.yandex.ru-shallow-20200710-175637-4u6vh-00000.warc.gz 1083221 download   job
music.yandex.ru-shallow-20200710-175637-4u6vh-00000.warc.os.cdx.gz 5642 download
music.yandex.ru-shallow-20200710-175637-4u6vh-meta.warc.gz 6415 download   job
music.yandex.ru-shallow-20200710-175637-4u6vh-meta.warc.os.cdx.gz 47 download
music.yandex.ru-shallow-20200710-175637-4u6vh.json 249 download   job
my.12371.cn-inf-20200710-175709-6r3lp-00000.warc.gz 2461 download   job
my.12371.cn-inf-20200710-175709-6r3lp-00000.warc.os.cdx.gz 47 download
my.12371.cn-inf-20200710-175709-6r3lp-meta.warc.gz 3520 download   job
my.12371.cn-inf-20200710-175709-6r3lp-meta.warc.os.cdx.gz 47 download
my.12371.cn-inf-20200710-175709-6r3lp.json 240 download   job
news.12371.cn-inf-20200710-175723-1ib3j-00000.warc.gz 4475712 download   job
news.12371.cn-inf-20200710-175723-1ib3j-00000.warc.os.cdx.gz 11662 download
news.12371.cn-inf-20200710-175723-1ib3j-meta.warc.gz 10450 download   job
news.12371.cn-inf-20200710-175723-1ib3j-meta.warc.os.cdx.gz 47 download
news.12371.cn-inf-20200710-175723-1ib3j.json 242 download   job
org.12377.cn-inf-20200710-174957-ayfet-00000.warc.gz 1610151314 download   job
org.12377.cn-inf-20200710-174957-ayfet-00000.warc.os.cdx.gz 483017 download
org.12377.cn-inf-20200710-174957-ayfet-meta.warc.gz 311560 download   job
org.12377.cn-inf-20200710-174957-ayfet-meta.warc.os.cdx.gz 47 download
org.12377.cn-inf-20200710-174957-ayfet.json 241 download   job
player.fm-inf-20200501-233943-6recr-00678.warc.gz 5410753056 download   job
player.fm-inf-20200501-233943-6recr-00678.warc.os.cdx.gz 250276 download
res.zhibu.12371.cn-inf-20200710-180823-dtofw-00000.warc.gz 2476 download   job
res.zhibu.12371.cn-inf-20200710-180823-dtofw-00000.warc.os.cdx.gz 47 download
res.zhibu.12371.cn-inf-20200710-180823-dtofw-meta.warc.gz 3576 download   job
res.zhibu.12371.cn-inf-20200710-180823-dtofw-meta.warc.os.cdx.gz 47 download
res.zhibu.12371.cn-inf-20200710-180823-dtofw.json 247 download   job
search.12371.cn-inf-20200710-175823-7uz8h-00000.warc.gz 66132 download   job
search.12371.cn-inf-20200710-175823-7uz8h-00000.warc.os.cdx.gz 712 download
search.12371.cn-inf-20200710-175823-7uz8h-meta.warc.gz 4196 download   job
search.12371.cn-inf-20200710-175823-7uz8h-meta.warc.os.cdx.gz 47 download
search.12371.cn-inf-20200710-175823-7uz8h.json 244 download   job
search.12371.cn-inf-20200710-175929-tjo2m-00000.warc.gz 64977 download   job
search.12371.cn-inf-20200710-175929-tjo2m-00000.warc.os.cdx.gz 659 download
search.12371.cn-inf-20200710-175929-tjo2m-meta.warc.gz 4156 download   job
search.12371.cn-inf-20200710-175929-tjo2m-meta.warc.os.cdx.gz 47 download
search.12371.cn-inf-20200710-175929-tjo2m-wpull.log.gz 1466 download
search.12371.cn-inf-20200710-175929-tjo2m.json 254 download   job
testpassport.12371.cn-inf-20200710-180752-c6vvu-00000.warc.gz 2481 download   job
testpassport.12371.cn-inf-20200710-180752-c6vvu-00000.warc.os.cdx.gz 47 download
testpassport.12371.cn-inf-20200710-180752-c6vvu-meta.warc.gz 3592 download   job
testpassport.12371.cn-inf-20200710-180752-c6vvu-meta.warc.os.cdx.gz 47 download
testpassport.12371.cn-inf-20200710-180752-c6vvu.json 250 download   job
urls-archive.max.fan-twitter-@PNUDGuinee-filtered.txt-shallow-20200710-182941-d5pkn-00000.warc.gz 63108872 download   job
urls-archive.max.fan-twitter-@PNUDGuinee-filtered.txt-shallow-20200710-182941-d5pkn-00000.warc.os.cdx.gz 69523 download
urls-archive.max.fan-twitter-@PNUDGuinee-filtered.txt-shallow-20200710-182941-d5pkn-meta.warc.gz 41158 download   job
urls-archive.max.fan-twitter-@PNUDGuinee-filtered.txt-shallow-20200710-182941-d5pkn-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@PNUDGuinee-filtered.txt-shallow-20200710-182941-d5pkn-urls.txt 28764 download
urls-archive.max.fan-twitter-@PNUDGuinee-filtered.txt-shallow-20200710-182941-d5pkn.json 335 download   job
urls-archive.max.fan-twitter-@POTUS-filtered.txt-shallow-20200710-182637-chan3-00000.warc.gz 156159284 download   job
urls-archive.max.fan-twitter-@POTUS-filtered.txt-shallow-20200710-182637-chan3-00000.warc.os.cdx.gz 393567 download
urls-archive.max.fan-twitter-@POTUS-filtered.txt-shallow-20200710-182637-chan3-meta.warc.gz 209194 download   job
urls-archive.max.fan-twitter-@POTUS-filtered.txt-shallow-20200710-182637-chan3-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@POTUS-filtered.txt-shallow-20200710-182637-chan3-urls.txt 21945 download
urls-archive.max.fan-twitter-@POTUS-filtered.txt-shallow-20200710-182637-chan3.json 325 download   job
urls-archive.max.fan-twitter-@POTUS44-filtered.txt-shallow-20200710-182638-9iujf-00000.warc.gz 82513302 download   job
urls-archive.max.fan-twitter-@POTUS44-filtered.txt-shallow-20200710-182638-9iujf-00000.warc.os.cdx.gz 300725 download
urls-archive.max.fan-twitter-@POTUS44-filtered.txt-shallow-20200710-182638-9iujf-meta.warc.gz 159888 download   job
urls-archive.max.fan-twitter-@POTUS44-filtered.txt-shallow-20200710-182638-9iujf-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@POTUS44-filtered.txt-shallow-20200710-182638-9iujf-urls.txt 17820 download
urls-archive.max.fan-twitter-@POTUS44-filtered.txt-shallow-20200710-182638-9iujf.json 329 download   job
urls-archive.max.fan-twitter-@PR_Senegal-filtered.txt-shallow-20200710-173555-290fi-00000.warc.gz 951406209 download   job
urls-archive.max.fan-twitter-@PR_Senegal-filtered.txt-shallow-20200710-173555-290fi-00000.warc.os.cdx.gz 1291669 download
urls-archive.max.fan-twitter-@PR_Senegal-filtered.txt-shallow-20200710-173555-290fi-meta.warc.gz 681907 download   job
urls-archive.max.fan-twitter-@PR_Senegal-filtered.txt-shallow-20200710-173555-290fi-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@PR_Senegal-filtered.txt-shallow-20200710-173555-290fi-urls.txt 186298 download
urls-archive.max.fan-twitter-@PR_Senegal-filtered.txt-shallow-20200710-173555-290fi.json 335 download   job
urls-archive.max.fan-twitter-@PetroglyphNPS-filtered.txt-shallow-20200710-184858-d345y-00000.warc.gz 48196241 download   job
urls-archive.max.fan-twitter-@PetroglyphNPS-filtered.txt-shallow-20200710-184858-d345y-00000.warc.os.cdx.gz 52062 download
urls-archive.max.fan-twitter-@PetroglyphNPS-filtered.txt-shallow-20200710-184858-d345y-meta.warc.gz 32368 download   job
urls-archive.max.fan-twitter-@PetroglyphNPS-filtered.txt-shallow-20200710-184858-d345y-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@PetroglyphNPS-filtered.txt-shallow-20200710-184858-d345y-urls.txt 14123 download
urls-archive.max.fan-twitter-@PetroglyphNPS-filtered.txt-shallow-20200710-184858-d345y.json 341 download   job
urls-archive.max.fan-twitter-@PhilSDGs-filtered.txt-shallow-20200710-183508-b9n06-urls.txt 154131 download
urls-archive.max.fan-twitter-@PhilScott4VT-filtered.txt-shallow-20200710-183538-dld8e-00000.warc.gz 307746993 download   job
urls-archive.max.fan-twitter-@PhilScott4VT-filtered.txt-shallow-20200710-183538-dld8e-00000.warc.os.cdx.gz 261278 download
urls-archive.max.fan-twitter-@PhilScott4VT-filtered.txt-shallow-20200710-183538-dld8e-meta.warc.gz 143159 download   job
urls-archive.max.fan-twitter-@PhilScott4VT-filtered.txt-shallow-20200710-183538-dld8e-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@PhilScott4VT-filtered.txt-shallow-20200710-183538-dld8e-urls.txt 126977 download
urls-archive.max.fan-twitter-@PhilScott4VT-filtered.txt-shallow-20200710-183538-dld8e.json 339 download   job
urls-archive.max.fan-twitter-@PhilipHammondUK-filtered.txt-shallow-20200710-183715-7mjlz-meta.warc.gz 708299 download   job
urls-archive.max.fan-twitter-@PhilipHammondUK-filtered.txt-shallow-20200710-183715-7mjlz-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@PineTreeLegal-filtered.txt-shallow-20200710-183049-7qvar-00000.warc.gz 63765291 download   job
urls-archive.max.fan-twitter-@PineTreeLegal-filtered.txt-shallow-20200710-183049-7qvar-00000.warc.os.cdx.gz 73005 download
urls-archive.max.fan-twitter-@PineTreeLegal-filtered.txt-shallow-20200710-183049-7qvar-meta.warc.gz 43812 download   job
urls-archive.max.fan-twitter-@PineTreeLegal-filtered.txt-shallow-20200710-183049-7qvar-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@PineTreeLegal-filtered.txt-shallow-20200710-183049-7qvar-urls.txt 41293 download
urls-archive.max.fan-twitter-@PineTreeLegal-filtered.txt-shallow-20200710-183049-7qvar.json 341 download   job
urls-archive.max.fan-twitter-@PlacerCA-filtered.txt-shallow-20200710-183047-25mtl-00000.warc.gz 808305998 download   job
urls-archive.max.fan-twitter-@PlacerCA-filtered.txt-shallow-20200710-183047-25mtl-00000.warc.os.cdx.gz 613156 download
urls-archive.max.fan-twitter-@PmTunisia-filtered.txt-shallow-20200710-183033-9flh2-00000.warc.gz 77782143 download   job
urls-archive.max.fan-twitter-@PmTunisia-filtered.txt-shallow-20200710-183033-9flh2-00000.warc.os.cdx.gz 68024 download
urls-archive.max.fan-twitter-@PmTunisia-filtered.txt-shallow-20200710-183033-9flh2-meta.warc.gz 40369 download   job
urls-archive.max.fan-twitter-@PmTunisia-filtered.txt-shallow-20200710-183033-9flh2-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@PmTunisia-filtered.txt-shallow-20200710-183033-9flh2-urls.txt 19095 download
urls-archive.max.fan-twitter-@PmTunisia-filtered.txt-shallow-20200710-183033-9flh2.json 333 download   job
urls-archive.max.fan-twitter-@Portugal_UN-filtered.txt-shallow-20200710-182707-9eq8r-00000.warc.gz 50523656 download   job
urls-archive.max.fan-twitter-@Portugal_UN-filtered.txt-shallow-20200710-182707-9eq8r-00000.warc.os.cdx.gz 83541 download
urls-archive.max.fan-twitter-@Portugal_UN-filtered.txt-shallow-20200710-182707-9eq8r-meta.warc.gz 48647 download   job
urls-archive.max.fan-twitter-@Portugal_UN-filtered.txt-shallow-20200710-182707-9eq8r-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@Portugal_UN-filtered.txt-shallow-20200710-182707-9eq8r-urls.txt 15451 download
urls-archive.max.fan-twitter-@Portugal_UN-filtered.txt-shallow-20200710-182707-9eq8r.json 337 download   job
urls-archive.max.fan-twitter-@PresParkNPS-filtered.txt-shallow-20200710-174714-4730f-00000.warc.gz 62250395 download   job
urls-archive.max.fan-twitter-@PresParkNPS-filtered.txt-shallow-20200710-174714-4730f-00000.warc.os.cdx.gz 89580 download
urls-archive.max.fan-twitter-@PresParkNPS-filtered.txt-shallow-20200710-174714-4730f-meta.warc.gz 52170 download   job
urls-archive.max.fan-twitter-@PresParkNPS-filtered.txt-shallow-20200710-174714-4730f-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@PresParkNPS-filtered.txt-shallow-20200710-174714-4730f-urls.txt 15791 download
urls-archive.max.fan-twitter-@PresParkNPS-filtered.txt-shallow-20200710-174714-4730f.json 337 download   job
urls-archive.max.fan-twitter-@PresidenceGA-filtered.txt-shallow-20200710-182635-8rcre-00000.warc.gz 433607023 download   job
urls-archive.max.fan-twitter-@PresidenceGA-filtered.txt-shallow-20200710-182635-8rcre-00000.warc.os.cdx.gz 568036 download
urls-archive.max.fan-twitter-@PresidenceGA-filtered.txt-shallow-20200710-182635-8rcre-meta.warc.gz 300443 download   job
urls-archive.max.fan-twitter-@PresidenceGA-filtered.txt-shallow-20200710-182635-8rcre-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@PresidenceGA-filtered.txt-shallow-20200710-182635-8rcre-urls.txt 171400 download
urls-archive.max.fan-twitter-@PresidenceGA-filtered.txt-shallow-20200710-182635-8rcre.json 339 download   job
urls-archive.max.fan-twitter-@PresidenceHT-filtered.txt-shallow-20200710-182634-1vp1m-00000.warc.gz 45910468 download   job
urls-archive.max.fan-twitter-@PresidenceHT-filtered.txt-shallow-20200710-182634-1vp1m-00000.warc.os.cdx.gz 117183 download
urls-archive.max.fan-twitter-@PresidenceHT-filtered.txt-shallow-20200710-182634-1vp1m-meta.warc.gz 65931 download   job
urls-archive.max.fan-twitter-@PresidenceHT-filtered.txt-shallow-20200710-182634-1vp1m-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@PresidenceHT-filtered.txt-shallow-20200710-182634-1vp1m-urls.txt 8619 download
urls-archive.max.fan-twitter-@PresidenceHT-filtered.txt-shallow-20200710-182634-1vp1m.json 339 download   job
urls-archive.max.fan-twitter-@PresidenceNiger-filtered.txt-shallow-20200710-181458-4c0p2-00000.warc.gz 634113925 download   job
urls-archive.max.fan-twitter-@PresidenceNiger-filtered.txt-shallow-20200710-181458-4c0p2-00000.warc.os.cdx.gz 819370 download
urls-archive.max.fan-twitter-@PresidenceNiger-filtered.txt-shallow-20200710-181458-4c0p2-meta.warc.gz 423960 download   job
urls-archive.max.fan-twitter-@PresidenceNiger-filtered.txt-shallow-20200710-181458-4c0p2-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@PresidenceNiger-filtered.txt-shallow-20200710-181458-4c0p2-urls.txt 176289 download
urls-archive.max.fan-twitter-@PresidenceNiger-filtered.txt-shallow-20200710-181458-4c0p2.json 345 download   job
urls-archive.max.fan-twitter-@PresidentABO-filtered.txt-shallow-20200710-181456-3i7zh-00000.warc.gz 289506173 download   job
urls-archive.max.fan-twitter-@PresidentABO-filtered.txt-shallow-20200710-181456-3i7zh-00000.warc.os.cdx.gz 583564 download
urls-archive.max.fan-twitter-@PresidentABO-filtered.txt-shallow-20200710-181456-3i7zh-meta.warc.gz 309823 download   job
urls-archive.max.fan-twitter-@PresidentABO-filtered.txt-shallow-20200710-181456-3i7zh-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@PresidentABO-filtered.txt-shallow-20200710-181456-3i7zh-urls.txt 91863 download
urls-archive.max.fan-twitter-@PresidentABO-filtered.txt-shallow-20200710-181456-3i7zh.json 339 download   job
urls-archive.max.fan-twitter-@PresidentRuvi-filtered.txt-shallow-20200710-174930-7827h-00000.warc.gz 376473414 download   job
urls-archive.max.fan-twitter-@PresidentRuvi-filtered.txt-shallow-20200710-174930-7827h-00000.warc.os.cdx.gz 795504 download
urls-archive.max.fan-twitter-@PresidentRuvi-filtered.txt-shallow-20200710-174930-7827h-meta.warc.gz 426181 download   job
urls-archive.max.fan-twitter-@PresidentRuvi-filtered.txt-shallow-20200710-174930-7827h-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@PresidentRuvi-filtered.txt-shallow-20200710-174930-7827h-urls.txt 86803 download
urls-archive.max.fan-twitter-@PresidentRuvi-filtered.txt-shallow-20200710-174930-7827h.json 341 download   job
urls-archive.max.fan-twitter-@PressSec-filtered.txt-shallow-20200710-174454-bj1fb-00000.warc.gz 620085557 download   job
urls-archive.max.fan-twitter-@PressSec-filtered.txt-shallow-20200710-174454-bj1fb-00000.warc.os.cdx.gz 1891850 download
urls-archive.max.fan-twitter-@PressSec-filtered.txt-shallow-20200710-174454-bj1fb-meta.warc.gz 984006 download   job
urls-archive.max.fan-twitter-@PressSec-filtered.txt-shallow-20200710-174454-bj1fb-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@PressSec-filtered.txt-shallow-20200710-174454-bj1fb-urls.txt 113487 download
urls-archive.max.fan-twitter-@PressSec-filtered.txt-shallow-20200710-174454-bj1fb.json 331 download   job
urls-archive.max.fan-twitter-@PrivacyProject-filtered.txt-shallow-20200710-174303-1h6dl-00000.warc.gz 149475917 download   job
urls-archive.max.fan-twitter-@PrivacyProject-filtered.txt-shallow-20200710-174303-1h6dl-00000.warc.os.cdx.gz 561396 download
urls-archive.max.fan-twitter-@PrivacyProject-filtered.txt-shallow-20200710-174303-1h6dl-meta.warc.gz 301157 download   job
urls-archive.max.fan-twitter-@PrivacyProject-filtered.txt-shallow-20200710-174303-1h6dl-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@PrivacyProject-filtered.txt-shallow-20200710-174303-1h6dl-urls.txt 113708 download
urls-archive.max.fan-twitter-@PrivacyProject-filtered.txt-shallow-20200710-174303-1h6dl.json 343 download   job
urls-archive.max.fan-twitter-@Puglaas-filtered.txt-shallow-20200710-173527-3bnzr-00000.warc.gz 734708866 download   job
urls-archive.max.fan-twitter-@Puglaas-filtered.txt-shallow-20200710-173527-3bnzr-00000.warc.os.cdx.gz 1209347 download
urls-archive.max.fan-twitter-@Puglaas-filtered.txt-shallow-20200710-173527-3bnzr-meta.warc.gz 649627 download   job
urls-archive.max.fan-twitter-@Puglaas-filtered.txt-shallow-20200710-173527-3bnzr-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@Puglaas-filtered.txt-shallow-20200710-173527-3bnzr-urls.txt 153122 download
urls-archive.max.fan-twitter-@Puglaas-filtered.txt-shallow-20200710-173527-3bnzr.json 329 download   job
urls-archive.max.fan-twitter-@RCPaddock-filtered.txt-shallow-20200710-172254-2chwd-00000.warc.gz 33574366 download   job
urls-archive.max.fan-twitter-@RCPaddock-filtered.txt-shallow-20200710-172254-2chwd-00000.warc.os.cdx.gz 78528 download
urls-archive.max.fan-twitter-@RCPaddock-filtered.txt-shallow-20200710-172254-2chwd-meta.warc.gz 46757 download   job
urls-archive.max.fan-twitter-@RCPaddock-filtered.txt-shallow-20200710-172254-2chwd-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RCPaddock-filtered.txt-shallow-20200710-172254-2chwd-urls.txt 23157 download
urls-archive.max.fan-twitter-@RCPaddock-filtered.txt-shallow-20200710-172254-2chwd.json 333 download   job
urls-archive.max.fan-twitter-@RDMISIONONU-filtered.txt-shallow-20200710-171956-42z5e-00000.warc.gz 30086318 download   job
urls-archive.max.fan-twitter-@RDMISIONONU-filtered.txt-shallow-20200710-171956-42z5e-00000.warc.os.cdx.gz 30444 download
urls-archive.max.fan-twitter-@RDMISIONONU-filtered.txt-shallow-20200710-171956-42z5e-meta.warc.gz 20519 download   job
urls-archive.max.fan-twitter-@RDMISIONONU-filtered.txt-shallow-20200710-171956-42z5e-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RDMISIONONU-filtered.txt-shallow-20200710-171956-42z5e-urls.txt 7407 download
urls-archive.max.fan-twitter-@RDMISIONONU-filtered.txt-shallow-20200710-171956-42z5e.json 337 download   job
urls-archive.max.fan-twitter-@RISecState-filtered.txt-shallow-20200710-155333-3img7-meta.warc.gz 396732 download   job
urls-archive.max.fan-twitter-@RISecState-filtered.txt-shallow-20200710-155333-3img7-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RISecState-filtered.txt-shallow-20200710-155333-3img7-urls.txt 248122 download
urls-archive.max.fan-twitter-@RISecState-filtered.txt-shallow-20200710-155333-3img7.json 335 download   job
urls-archive.max.fan-twitter-@RaR-filtered.txt-shallow-20200710-172515-dwl9t-00000.warc.gz 177309478 download   job
urls-archive.max.fan-twitter-@RaR-filtered.txt-shallow-20200710-172515-dwl9t-00000.warc.os.cdx.gz 376534 download
urls-archive.max.fan-twitter-@RaR-filtered.txt-shallow-20200710-172515-dwl9t-meta.warc.gz 202907 download   job
urls-archive.max.fan-twitter-@RaR-filtered.txt-shallow-20200710-172515-dwl9t-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RaR-filtered.txt-shallow-20200710-172515-dwl9t-urls.txt 103052 download
urls-archive.max.fan-twitter-@RaR-filtered.txt-shallow-20200710-172515-dwl9t.json 321 download   job
urls-archive.max.fan-twitter-@RadioMiraya-filtered.txt-shallow-20200710-173523-2zwbj-00000.warc.gz 1776460268 download   job
urls-archive.max.fan-twitter-@RadioMiraya-filtered.txt-shallow-20200710-173523-2zwbj-00000.warc.os.cdx.gz 1816633 download
urls-archive.max.fan-twitter-@RadioMiraya-filtered.txt-shallow-20200710-173523-2zwbj-meta.warc.gz 943888 download   job
urls-archive.max.fan-twitter-@RadioMiraya-filtered.txt-shallow-20200710-173523-2zwbj-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RadioMiraya-filtered.txt-shallow-20200710-173523-2zwbj-urls.txt 733069 download
urls-archive.max.fan-twitter-@RadioMiraya-filtered.txt-shallow-20200710-173523-2zwbj.json 337 download   job
urls-archive.max.fan-twitter-@RafaGCS-filtered.txt-shallow-20200710-172819-9apxv-00000.warc.gz 22587039 download   job
urls-archive.max.fan-twitter-@RafaGCS-filtered.txt-shallow-20200710-172819-9apxv-00000.warc.os.cdx.gz 32820 download
urls-archive.max.fan-twitter-@RafaGCS-filtered.txt-shallow-20200710-172819-9apxv-meta.warc.gz 22356 download   job
urls-archive.max.fan-twitter-@RafaGCS-filtered.txt-shallow-20200710-172819-9apxv-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RafaGCS-filtered.txt-shallow-20200710-172819-9apxv-urls.txt 17688 download
urls-archive.max.fan-twitter-@RafaGCS-filtered.txt-shallow-20200710-172819-9apxv.json 329 download   job
urls-archive.max.fan-twitter-@RapidResponse-filtered.txt-shallow-20200710-172520-9g4yj-00000.warc.gz 133308503 download   job
urls-archive.max.fan-twitter-@RapidResponse-filtered.txt-shallow-20200710-172520-9g4yj-00000.warc.os.cdx.gz 143607 download
urls-archive.max.fan-twitter-@RapidResponse-filtered.txt-shallow-20200710-172520-9g4yj-meta.warc.gz 79409 download   job
urls-archive.max.fan-twitter-@RapidResponse-filtered.txt-shallow-20200710-172520-9g4yj-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RapidResponse-filtered.txt-shallow-20200710-172520-9g4yj-urls.txt 42743 download
urls-archive.max.fan-twitter-@RapidResponse-filtered.txt-shallow-20200710-172520-9g4yj.json 341 download   job
urls-archive.max.fan-twitter-@RaulGonzalez-filtered.txt-shallow-20200710-172409-7kcwo-00000.warc.gz 85795602 download   job
urls-archive.max.fan-twitter-@RaulGonzalez-filtered.txt-shallow-20200710-172409-7kcwo-00000.warc.os.cdx.gz 229886 download
urls-archive.max.fan-twitter-@RaulGonzalez-filtered.txt-shallow-20200710-172409-7kcwo-meta.warc.gz 126371 download   job
urls-archive.max.fan-twitter-@RaulGonzalez-filtered.txt-shallow-20200710-172409-7kcwo-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RaulGonzalez-filtered.txt-shallow-20200710-172409-7kcwo-urls.txt 14599 download
urls-archive.max.fan-twitter-@RaulGonzalez-filtered.txt-shallow-20200710-172409-7kcwo.json 339 download   job
urls-archive.max.fan-twitter-@RealBenCarson-filtered.txt-shallow-20200710-171547-7tu3t-00000.warc.gz 483640190 download   job
urls-archive.max.fan-twitter-@RealBenCarson-filtered.txt-shallow-20200710-171547-7tu3t-00000.warc.os.cdx.gz 1991861 download
urls-archive.max.fan-twitter-@RealBenCarson-filtered.txt-shallow-20200710-171547-7tu3t-meta.warc.gz 1066196 download   job
urls-archive.max.fan-twitter-@RealBenCarson-filtered.txt-shallow-20200710-171547-7tu3t-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RealBenCarson-filtered.txt-shallow-20200710-171547-7tu3t-urls.txt 145398 download
urls-archive.max.fan-twitter-@RealBenCarson-filtered.txt-shallow-20200710-171547-7tu3t.json 341 download   job
urls-archive.max.fan-twitter-@RebeccaKatz5-filtered.txt-shallow-20200710-171000-5y58v-00000.warc.gz 54564143 download   job
urls-archive.max.fan-twitter-@RebeccaKatz5-filtered.txt-shallow-20200710-171000-5y58v-00000.warc.os.cdx.gz 101200 download
urls-archive.max.fan-twitter-@RebeccaKatz5-filtered.txt-shallow-20200710-171000-5y58v-meta.warc.gz 58968 download   job
urls-archive.max.fan-twitter-@RebeccaKatz5-filtered.txt-shallow-20200710-171000-5y58v-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RebeccaKatz5-filtered.txt-shallow-20200710-171000-5y58v-urls.txt 22831 download
urls-archive.max.fan-twitter-@RebeccaKatz5-filtered.txt-shallow-20200710-171000-5y58v.json 339 download   job
urls-archive.max.fan-twitter-@RedCrossENC-filtered.txt-shallow-20200710-170956-aa68o-00000.warc.gz 229911677 download   job
urls-archive.max.fan-twitter-@RedCrossENC-filtered.txt-shallow-20200710-170956-aa68o-00000.warc.os.cdx.gz 214356 download
urls-archive.max.fan-twitter-@RedCrossENC-filtered.txt-shallow-20200710-170956-aa68o-meta.warc.gz 116917 download   job
urls-archive.max.fan-twitter-@RedCrossENC-filtered.txt-shallow-20200710-170956-aa68o-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RedCrossENC-filtered.txt-shallow-20200710-170956-aa68o-urls.txt 102506 download
urls-archive.max.fan-twitter-@RedCrossENC-filtered.txt-shallow-20200710-170956-aa68o.json 337 download   job
urls-archive.max.fan-twitter-@RefugeeAwareNet-filtered.txt-shallow-20200710-170917-bg75m-00000.warc.gz 1696959 download   job
urls-archive.max.fan-twitter-@RefugeeAwareNet-filtered.txt-shallow-20200710-170917-bg75m-00000.warc.os.cdx.gz 4635 download
urls-archive.max.fan-twitter-@RefugeeAwareNet-filtered.txt-shallow-20200710-170917-bg75m-meta.warc.gz 6455 download   job
urls-archive.max.fan-twitter-@RefugeeAwareNet-filtered.txt-shallow-20200710-170917-bg75m-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RefugeeAwareNet-filtered.txt-shallow-20200710-170917-bg75m-urls.txt 806 download
urls-archive.max.fan-twitter-@RefugeeAwareNet-filtered.txt-shallow-20200710-170917-bg75m.json 345 download   job
urls-archive.max.fan-twitter-@RefugeeUSA-filtered.txt-shallow-20200710-170730-bqr1f-00000.warc.gz 2161663 download   job
urls-archive.max.fan-twitter-@RefugeeUSA-filtered.txt-shallow-20200710-170730-bqr1f-00000.warc.os.cdx.gz 5205 download
urls-archive.max.fan-twitter-@RefugeeUSA-filtered.txt-shallow-20200710-170730-bqr1f-meta.warc.gz 6748 download   job
urls-archive.max.fan-twitter-@RefugeeUSA-filtered.txt-shallow-20200710-170730-bqr1f-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RefugeeUSA-filtered.txt-shallow-20200710-170730-bqr1f-urls.txt 1254 download
urls-archive.max.fan-twitter-@RefugeeUSA-filtered.txt-shallow-20200710-170730-bqr1f.json 335 download   job
urls-archive.max.fan-twitter-@RefugeesRwanda-filtered.txt-shallow-20200710-170732-7psls-00000.warc.gz 133862223 download   job
urls-archive.max.fan-twitter-@RefugeesRwanda-filtered.txt-shallow-20200710-170732-7psls-00000.warc.os.cdx.gz 213472 download
urls-archive.max.fan-twitter-@RefugeesRwanda-filtered.txt-shallow-20200710-170732-7psls-meta.warc.gz 117893 download   job
urls-archive.max.fan-twitter-@RefugeesRwanda-filtered.txt-shallow-20200710-170732-7psls-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RefugeesRwanda-filtered.txt-shallow-20200710-170732-7psls-urls.txt 39493 download
urls-archive.max.fan-twitter-@RefugeesRwanda-filtered.txt-shallow-20200710-170732-7psls.json 343 download   job
urls-archive.max.fan-twitter-@RepAlLawsonJr-filtered.txt-shallow-20200710-170619-8bisy-00000.warc.gz 239416143 download   job
urls-archive.max.fan-twitter-@RepAlLawsonJr-filtered.txt-shallow-20200710-170619-8bisy-00000.warc.os.cdx.gz 361548 download
urls-archive.max.fan-twitter-@RepAlLawsonJr-filtered.txt-shallow-20200710-170619-8bisy-meta.warc.gz 195276 download   job
urls-archive.max.fan-twitter-@RepAlLawsonJr-filtered.txt-shallow-20200710-170619-8bisy-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepAlLawsonJr-filtered.txt-shallow-20200710-170619-8bisy-urls.txt 74739 download
urls-archive.max.fan-twitter-@RepAlLawsonJr-filtered.txt-shallow-20200710-170619-8bisy.json 341 download   job
urls-archive.max.fan-twitter-@RepArmstrongND-filtered.txt-shallow-20200710-170251-60wp3-00000.warc.gz 220420514 download   job
urls-archive.max.fan-twitter-@RepArmstrongND-filtered.txt-shallow-20200710-170251-60wp3-00000.warc.os.cdx.gz 482693 download
urls-archive.max.fan-twitter-@RepArmstrongND-filtered.txt-shallow-20200710-170251-60wp3-meta.warc.gz 257982 download   job
urls-archive.max.fan-twitter-@RepArmstrongND-filtered.txt-shallow-20200710-170251-60wp3-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepArmstrongND-filtered.txt-shallow-20200710-170251-60wp3-urls.txt 62682 download
urls-archive.max.fan-twitter-@RepArmstrongND-filtered.txt-shallow-20200710-170251-60wp3.json 343 download   job
urls-archive.max.fan-twitter-@RepBonnie-filtered.txt-shallow-20200710-170249-9329e-00000.warc.gz 712021372 download   job
urls-archive.max.fan-twitter-@RepBonnie-filtered.txt-shallow-20200710-170249-9329e-00000.warc.os.cdx.gz 1523567 download
urls-archive.max.fan-twitter-@RepBonnie-filtered.txt-shallow-20200710-170249-9329e-meta.warc.gz 796554 download   job
urls-archive.max.fan-twitter-@RepBonnie-filtered.txt-shallow-20200710-170249-9329e-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepBonnie-filtered.txt-shallow-20200710-170249-9329e-urls.txt 289412 download
urls-archive.max.fan-twitter-@RepBonnie-filtered.txt-shallow-20200710-170249-9329e.json 333 download   job
urls-archive.max.fan-twitter-@RepBuddyCarter-filtered.txt-shallow-20200710-170247-f10j4-00000.warc.gz 354872443 download   job
urls-archive.max.fan-twitter-@RepBuddyCarter-filtered.txt-shallow-20200710-170247-f10j4-00000.warc.os.cdx.gz 602205 download
urls-archive.max.fan-twitter-@RepBuddyCarter-filtered.txt-shallow-20200710-170247-f10j4-meta.warc.gz 319664 download   job
urls-archive.max.fan-twitter-@RepBuddyCarter-filtered.txt-shallow-20200710-170247-f10j4-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepBuddyCarter-filtered.txt-shallow-20200710-170247-f10j4-urls.txt 116729 download
urls-archive.max.fan-twitter-@RepBuddyCarter-filtered.txt-shallow-20200710-170247-f10j4.json 343 download   job
urls-archive.max.fan-twitter-@RepByrne-filtered.txt-shallow-20200710-170245-4fx4r-00000.warc.gz 1610798188 download   job
urls-archive.max.fan-twitter-@RepByrne-filtered.txt-shallow-20200710-170245-4fx4r-00000.warc.os.cdx.gz 2147752 download
urls-archive.max.fan-twitter-@RepByrne-filtered.txt-shallow-20200710-170245-4fx4r-meta.warc.gz 1125805 download   job
urls-archive.max.fan-twitter-@RepByrne-filtered.txt-shallow-20200710-170245-4fx4r-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepByrne-filtered.txt-shallow-20200710-170245-4fx4r-urls.txt 646727 download
urls-archive.max.fan-twitter-@RepByrne-filtered.txt-shallow-20200710-170245-4fx4r.json 331 download   job
urls-archive.max.fan-twitter-@RepCarolMiller-filtered.txt-shallow-20200710-170211-9emqy-00000.warc.gz 148966998 download   job
urls-archive.max.fan-twitter-@RepCarolMiller-filtered.txt-shallow-20200710-170211-9emqy-00000.warc.os.cdx.gz 284458 download
urls-archive.max.fan-twitter-@RepCarolMiller-filtered.txt-shallow-20200710-170211-9emqy-meta.warc.gz 152941 download   job
urls-archive.max.fan-twitter-@RepCarolMiller-filtered.txt-shallow-20200710-170211-9emqy-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepCarolMiller-filtered.txt-shallow-20200710-170211-9emqy-urls.txt 42098 download
urls-archive.max.fan-twitter-@RepCarolMiller-filtered.txt-shallow-20200710-170211-9emqy.json 343 download   job
urls-archive.max.fan-twitter-@RepCasten-filtered.txt-shallow-20200710-170205-41zqr-00000.warc.gz 292352207 download   job
urls-archive.max.fan-twitter-@RepCasten-filtered.txt-shallow-20200710-170205-41zqr-00000.warc.os.cdx.gz 526525 download
urls-archive.max.fan-twitter-@RepCasten-filtered.txt-shallow-20200710-170205-41zqr-meta.warc.gz 281381 download   job
urls-archive.max.fan-twitter-@RepCasten-filtered.txt-shallow-20200710-170205-41zqr-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepCasten-filtered.txt-shallow-20200710-170205-41zqr-urls.txt 97014 download
urls-archive.max.fan-twitter-@RepCasten-filtered.txt-shallow-20200710-170205-41zqr.json 333 download   job
urls-archive.max.fan-twitter-@RepChipRoy-filtered.txt-shallow-20200710-165836-dhfgn-00000.warc.gz 307858733 download   job
urls-archive.max.fan-twitter-@RepChipRoy-filtered.txt-shallow-20200710-165836-dhfgn-00000.warc.os.cdx.gz 855830 download
urls-archive.max.fan-twitter-@RepChipRoy-filtered.txt-shallow-20200710-165836-dhfgn-meta.warc.gz 449163 download   job
urls-archive.max.fan-twitter-@RepChipRoy-filtered.txt-shallow-20200710-165836-dhfgn-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepChipRoy-filtered.txt-shallow-20200710-165836-dhfgn-urls.txt 128006 download
urls-archive.max.fan-twitter-@RepChipRoy-filtered.txt-shallow-20200710-165836-dhfgn.json 335 download   job
urls-archive.max.fan-twitter-@RepChuyGarcia-filtered.txt-shallow-20200710-165835-1rvaj-00000.warc.gz 264331883 download   job
urls-archive.max.fan-twitter-@RepChuyGarcia-filtered.txt-shallow-20200710-165835-1rvaj-00000.warc.os.cdx.gz 517656 download
urls-archive.max.fan-twitter-@RepChuyGarcia-filtered.txt-shallow-20200710-165835-1rvaj-meta.warc.gz 273625 download   job
urls-archive.max.fan-twitter-@RepChuyGarcia-filtered.txt-shallow-20200710-165835-1rvaj-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepChuyGarcia-filtered.txt-shallow-20200710-165835-1rvaj-urls.txt 86925 download
urls-archive.max.fan-twitter-@RepChuyGarcia-filtered.txt-shallow-20200710-165835-1rvaj.json 341 download   job
urls-archive.max.fan-twitter-@RepDanBishop-filtered.txt-shallow-20200710-165830-2ebp5-00000.warc.gz 48828319 download   job
urls-archive.max.fan-twitter-@RepDanBishop-filtered.txt-shallow-20200710-165830-2ebp5-00000.warc.os.cdx.gz 96811 download
urls-archive.max.fan-twitter-@RepDanBishop-filtered.txt-shallow-20200710-165830-2ebp5-meta.warc.gz 56057 download   job
urls-archive.max.fan-twitter-@RepDanBishop-filtered.txt-shallow-20200710-165830-2ebp5-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepDanBishop-filtered.txt-shallow-20200710-165830-2ebp5-urls.txt 19740 download
urls-archive.max.fan-twitter-@RepDanBishop-filtered.txt-shallow-20200710-165830-2ebp5.json 339 download   job
urls-archive.max.fan-twitter-@RepDanCrenshaw-filtered.txt-shallow-20200710-165733-1rjjr-00000.warc.gz 191763404 download   job
urls-archive.max.fan-twitter-@RepDanCrenshaw-filtered.txt-shallow-20200710-165733-1rjjr-00000.warc.os.cdx.gz 753586 download
urls-archive.max.fan-twitter-@RepDanCrenshaw-filtered.txt-shallow-20200710-165733-1rjjr-meta.warc.gz 392527 download   job
urls-archive.max.fan-twitter-@RepDanCrenshaw-filtered.txt-shallow-20200710-165733-1rjjr-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepDanCrenshaw-filtered.txt-shallow-20200710-165733-1rjjr-urls.txt 47430 download
urls-archive.max.fan-twitter-@RepDanCrenshaw-filtered.txt-shallow-20200710-165733-1rjjr.json 343 download   job
urls-archive.max.fan-twitter-@RepDeSaulnier-filtered.txt-shallow-20200710-165717-32xwi-00000.warc.gz 803358966 download   job
urls-archive.max.fan-twitter-@RepDeSaulnier-filtered.txt-shallow-20200710-165717-32xwi-00000.warc.os.cdx.gz 1129461 download
urls-archive.max.fan-twitter-@RepDeSaulnier-filtered.txt-shallow-20200710-165717-32xwi-meta.warc.gz 598698 download   job
urls-archive.max.fan-twitter-@RepDeSaulnier-filtered.txt-shallow-20200710-165717-32xwi-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepDeSaulnier-filtered.txt-shallow-20200710-165717-32xwi-urls.txt 282885 download
urls-archive.max.fan-twitter-@RepDeSaulnier-filtered.txt-shallow-20200710-165717-32xwi.json 341 download   job
urls-archive.max.fan-twitter-@RepDebDingell-filtered.txt-shallow-20200710-165723-aviwx-00000.warc.gz 588876697 download   job
urls-archive.max.fan-twitter-@RepDebDingell-filtered.txt-shallow-20200710-165723-aviwx-00000.warc.os.cdx.gz 1544424 download
urls-archive.max.fan-twitter-@RepDebDingell-filtered.txt-shallow-20200710-165723-aviwx-meta.warc.gz 817683 download   job
urls-archive.max.fan-twitter-@RepDebDingell-filtered.txt-shallow-20200710-165723-aviwx-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepDebDingell-filtered.txt-shallow-20200710-165723-aviwx-urls.txt 234616 download
urls-archive.max.fan-twitter-@RepDebDingell-filtered.txt-shallow-20200710-165723-aviwx.json 341 download   job
urls-archive.max.fan-twitter-@RepDrewFerguson-filtered.txt-shallow-20200710-165716-44i6l-00000.warc.gz 230628377 download   job
urls-archive.max.fan-twitter-@RepDrewFerguson-filtered.txt-shallow-20200710-165716-44i6l-00000.warc.os.cdx.gz 355886 download
urls-archive.max.fan-twitter-@RepDrewFerguson-filtered.txt-shallow-20200710-165716-44i6l-meta.warc.gz 189403 download   job
urls-archive.max.fan-twitter-@RepDrewFerguson-filtered.txt-shallow-20200710-165716-44i6l-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepDrewFerguson-filtered.txt-shallow-20200710-165716-44i6l-urls.txt 97019 download
urls-archive.max.fan-twitter-@RepDrewFerguson-filtered.txt-shallow-20200710-165716-44i6l.json 345 download   job
urls-archive.max.fan-twitter-@RepFredKeller-filtered.txt-shallow-20200710-165455-8zs1k-00000.warc.gz 253804077 download   job
urls-archive.max.fan-twitter-@RepFredKeller-filtered.txt-shallow-20200710-165455-8zs1k-00000.warc.os.cdx.gz 482459 download
urls-archive.max.fan-twitter-@RepFredKeller-filtered.txt-shallow-20200710-165455-8zs1k-meta.warc.gz 256365 download   job
urls-archive.max.fan-twitter-@RepFredKeller-filtered.txt-shallow-20200710-165455-8zs1k-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepFredKeller-filtered.txt-shallow-20200710-165455-8zs1k-urls.txt 69418 download
urls-archive.max.fan-twitter-@RepFredKeller-filtered.txt-shallow-20200710-165455-8zs1k.json 341 download   job
urls-archive.max.fan-twitter-@RepGregMurphy-filtered.txt-shallow-20200710-165450-bel5p-00000.warc.gz 50931409 download   job
urls-archive.max.fan-twitter-@RepGregMurphy-filtered.txt-shallow-20200710-165450-bel5p-00000.warc.os.cdx.gz 142118 download
urls-archive.max.fan-twitter-@RepGregMurphy-filtered.txt-shallow-20200710-165450-bel5p-meta.warc.gz 79942 download   job
urls-archive.max.fan-twitter-@RepGregMurphy-filtered.txt-shallow-20200710-165450-bel5p-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepGregMurphy-filtered.txt-shallow-20200710-165450-bel5p-urls.txt 16348 download
urls-archive.max.fan-twitter-@RepGregPence-filtered.txt-shallow-20200710-165445-w22vp-00000.warc.gz 181765320 download   job
urls-archive.max.fan-twitter-@RepGregPence-filtered.txt-shallow-20200710-165445-w22vp-00000.warc.os.cdx.gz 305979 download
urls-archive.max.fan-twitter-@RepGregPence-filtered.txt-shallow-20200710-165445-w22vp-meta.warc.gz 163694 download   job
urls-archive.max.fan-twitter-@RepGregPence-filtered.txt-shallow-20200710-165445-w22vp-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepGregPence-filtered.txt-shallow-20200710-165445-w22vp-urls.txt 47100 download
urls-archive.max.fan-twitter-@RepGregSteube-filtered.txt-shallow-20200710-165050-d7roh-00000.warc.gz 127654792 download   job
urls-archive.max.fan-twitter-@RepGregSteube-filtered.txt-shallow-20200710-165050-d7roh-00000.warc.os.cdx.gz 372695 download
urls-archive.max.fan-twitter-@RepGregSteube-filtered.txt-shallow-20200710-165050-d7roh-meta.warc.gz 199411 download   job
urls-archive.max.fan-twitter-@RepGregSteube-filtered.txt-shallow-20200710-165050-d7roh-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepGregSteube-filtered.txt-shallow-20200710-165050-d7roh-urls.txt 46116 download
urls-archive.max.fan-twitter-@RepGregSteube-filtered.txt-shallow-20200710-165050-d7roh.json 341 download   job
urls-archive.max.fan-twitter-@RepGrothman-filtered.txt-shallow-20200710-165041-26w1p-00000.warc.gz 574631583 download   job
urls-archive.max.fan-twitter-@RepGrothman-filtered.txt-shallow-20200710-165041-26w1p-00000.warc.os.cdx.gz 615613 download
urls-archive.max.fan-twitter-@RepGrothman-filtered.txt-shallow-20200710-165041-26w1p-meta.warc.gz 326650 download   job
urls-archive.max.fan-twitter-@RepGrothman-filtered.txt-shallow-20200710-165041-26w1p-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepGrothman-filtered.txt-shallow-20200710-165041-26w1p-urls.txt 134075 download
urls-archive.max.fan-twitter-@RepGrothman-filtered.txt-shallow-20200710-165041-26w1p.json 337 download   job
urls-archive.max.fan-twitter-@RepHagedorn-filtered.txt-shallow-20200710-165036-3yl6j-00000.warc.gz 169973821 download   job
urls-archive.max.fan-twitter-@RepHagedorn-filtered.txt-shallow-20200710-165036-3yl6j-00000.warc.os.cdx.gz 231487 download
urls-archive.max.fan-twitter-@RepHagedorn-filtered.txt-shallow-20200710-165036-3yl6j-meta.warc.gz 126141 download   job
urls-archive.max.fan-twitter-@RepHagedorn-filtered.txt-shallow-20200710-165036-3yl6j-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepHagedorn-filtered.txt-shallow-20200710-165036-3yl6j-urls.txt 51979 download
urls-archive.max.fan-twitter-@RepJimBaird-filtered.txt-shallow-20200710-165036-dyvb2-00000.warc.gz 62702626 download   job
urls-archive.max.fan-twitter-@RepJimBaird-filtered.txt-shallow-20200710-165036-dyvb2-00000.warc.os.cdx.gz 88690 download
urls-archive.max.fan-twitter-@RepJimBaird-filtered.txt-shallow-20200710-165036-dyvb2-meta.warc.gz 51979 download   job
urls-archive.max.fan-twitter-@RepJimBaird-filtered.txt-shallow-20200710-165036-dyvb2-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepJimBaird-filtered.txt-shallow-20200710-165036-dyvb2-urls.txt 18880 download
urls-archive.max.fan-twitter-@RepJimBaird-filtered.txt-shallow-20200710-165036-dyvb2.json 337 download   job
urls-archive.max.fan-twitter-@RepJohnJoyce-filtered.txt-shallow-20200710-165034-48pfj-00000.warc.gz 200923675 download   job
urls-archive.max.fan-twitter-@RepJohnJoyce-filtered.txt-shallow-20200710-165034-48pfj-00000.warc.os.cdx.gz 312730 download
urls-archive.max.fan-twitter-@RepJohnJoyce-filtered.txt-shallow-20200710-165034-48pfj-meta.warc.gz 166657 download   job
urls-archive.max.fan-twitter-@RepJohnJoyce-filtered.txt-shallow-20200710-165034-48pfj-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepJohnJoyce-filtered.txt-shallow-20200710-165034-48pfj-urls.txt 50220 download
urls-archive.max.fan-twitter-@RepJohnJoyce-filtered.txt-shallow-20200710-165034-48pfj.json 339 download   job
urls-archive.max.fan-twitter-@RepJohnKatko-filtered.txt-shallow-20200710-164817-dmka3-meta.warc.gz 164848 download   job
urls-archive.max.fan-twitter-@RepJohnKatko-filtered.txt-shallow-20200710-164817-dmka3-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepJohnKatko-filtered.txt-shallow-20200710-164817-dmka3-urls.txt 47663 download
urls-archive.max.fan-twitter-@RepJohnKatko-filtered.txt-shallow-20200710-164817-dmka3.json 339 download   job
urls-archive.max.fan-twitter-@RepJohnRose-filtered.txt-shallow-20200710-164810-aly1h-00000.warc.gz 113563115 download   job
urls-archive.max.fan-twitter-@RepJohnRose-filtered.txt-shallow-20200710-164810-aly1h-00000.warc.os.cdx.gz 131161 download
urls-archive.max.fan-twitter-@RepJohnRose-filtered.txt-shallow-20200710-164810-aly1h-meta.warc.gz 73784 download   job
urls-archive.max.fan-twitter-@RepJohnRose-filtered.txt-shallow-20200710-164810-aly1h-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepJohnRose-filtered.txt-shallow-20200710-164810-aly1h-urls.txt 25960 download
urls-archive.max.fan-twitter-@RepJohnRose-filtered.txt-shallow-20200710-164810-aly1h.json 337 download   job
urls-archive.max.fan-twitter-@RepKathleenRice-filtered.txt-shallow-20200710-164413-7vnjk-00000.warc.gz 375295359 download   job
urls-archive.max.fan-twitter-@RepKathleenRice-filtered.txt-shallow-20200710-164413-7vnjk-00000.warc.os.cdx.gz 916252 download
urls-archive.max.fan-twitter-@RepKathleenRice-filtered.txt-shallow-20200710-164413-7vnjk-meta.warc.gz 481213 download   job
urls-archive.max.fan-twitter-@RepKathleenRice-filtered.txt-shallow-20200710-164413-7vnjk-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepKathleenRice-filtered.txt-shallow-20200710-164413-7vnjk-urls.txt 180560 download
urls-archive.max.fan-twitter-@RepKathleenRice-filtered.txt-shallow-20200710-164413-7vnjk.json 345 download   job
urls-archive.max.fan-twitter-@RepKendraHorn-filtered.txt-shallow-20200710-164411-6iybx-00000.warc.gz 166312634 download   job
urls-archive.max.fan-twitter-@RepKendraHorn-filtered.txt-shallow-20200710-164411-6iybx-00000.warc.os.cdx.gz 346897 download
urls-archive.max.fan-twitter-@RepKendraHorn-filtered.txt-shallow-20200710-164411-6iybx-meta.warc.gz 188895 download   job
urls-archive.max.fan-twitter-@RepKendraHorn-filtered.txt-shallow-20200710-164411-6iybx-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepKendraHorn-filtered.txt-shallow-20200710-164411-6iybx-urls.txt 50081 download
urls-archive.max.fan-twitter-@RepKendraHorn-filtered.txt-shallow-20200710-164411-6iybx.json 341 download   job
urls-archive.max.fan-twitter-@RepLucyMcBath-filtered.txt-shallow-20200710-164403-8hcfa-00000.warc.gz 155735941 download   job
urls-archive.max.fan-twitter-@RepLucyMcBath-filtered.txt-shallow-20200710-164403-8hcfa-00000.warc.os.cdx.gz 415364 download
urls-archive.max.fan-twitter-@RepLucyMcBath-filtered.txt-shallow-20200710-164403-8hcfa-meta.warc.gz 222650 download   job
urls-archive.max.fan-twitter-@RepLucyMcBath-filtered.txt-shallow-20200710-164403-8hcfa-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepLucyMcBath-filtered.txt-shallow-20200710-164403-8hcfa-urls.txt 43554 download
urls-archive.max.fan-twitter-@RepMarkTakai-filtered.txt-shallow-20200710-164324-1q8oh-urls.txt 28910 download
urls-archive.max.fan-twitter-@RepMattGaetz-filtered.txt-shallow-20200710-164252-einrt-00000.warc.gz 1283672784 download   job
urls-archive.max.fan-twitter-@RepMattGaetz-filtered.txt-shallow-20200710-164252-einrt-00000.warc.os.cdx.gz 3219198 download
urls-archive.max.fan-twitter-@RepMattGaetz-filtered.txt-shallow-20200710-164252-einrt-meta.warc.gz 1684086 download   job
urls-archive.max.fan-twitter-@RepMattGaetz-filtered.txt-shallow-20200710-164252-einrt-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepMattGaetz-filtered.txt-shallow-20200710-164252-einrt-urls.txt 251007 download
urls-archive.max.fan-twitter-@RepMattGaetz-filtered.txt-shallow-20200710-164252-einrt.json 339 download   job
urls-archive.max.fan-twitter-@RepMeuser-filtered.txt-shallow-20200710-164249-2sog7-00000.warc.gz 124521317 download   job
urls-archive.max.fan-twitter-@RepMeuser-filtered.txt-shallow-20200710-164249-2sog7-00000.warc.os.cdx.gz 270798 download
urls-archive.max.fan-twitter-@RepMeuser-filtered.txt-shallow-20200710-164249-2sog7-urls.txt 40299 download
urls-archive.max.fan-twitter-@RepMeuser-filtered.txt-shallow-20200710-164249-2sog7.json 333 download   job
urls-archive.max.fan-twitter-@RepMichaelGuest-filtered.txt-shallow-20200710-164213-ahd93-00000.warc.gz 95732744 download   job
urls-archive.max.fan-twitter-@RepMichaelGuest-filtered.txt-shallow-20200710-164213-ahd93-00000.warc.os.cdx.gz 206312 download
urls-archive.max.fan-twitter-@RepMichaelGuest-filtered.txt-shallow-20200710-164213-ahd93-meta.warc.gz 114020 download   job
urls-archive.max.fan-twitter-@RepMichaelGuest-filtered.txt-shallow-20200710-164213-ahd93-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepMichaelGuest-filtered.txt-shallow-20200710-164213-ahd93-urls.txt 37233 download
urls-archive.max.fan-twitter-@RepMichaelGuest-filtered.txt-shallow-20200710-164213-ahd93.json 345 download   job
urls-archive.max.fan-twitter-@RepMichaelWaltz-filtered.txt-shallow-20200710-164212-d33f2-00000.warc.gz 407233315 download   job
urls-archive.max.fan-twitter-@RepMichaelWaltz-filtered.txt-shallow-20200710-164212-d33f2-00000.warc.os.cdx.gz 803764 download
urls-archive.max.fan-twitter-@RepMichaelWaltz-filtered.txt-shallow-20200710-164212-d33f2-meta.warc.gz 424115 download   job
urls-archive.max.fan-twitter-@RepMichaelWaltz-filtered.txt-shallow-20200710-164212-d33f2-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepMichaelWaltz-filtered.txt-shallow-20200710-164212-d33f2-urls.txt 123228 download
urls-archive.max.fan-twitter-@RepMichaelWaltz-filtered.txt-shallow-20200710-164212-d33f2.json 345 download   job
urls-archive.max.fan-twitter-@RepMikeGarcia-filtered.txt-shallow-20200710-162713-co7gw-00000.warc.gz 5481538 download   job
urls-archive.max.fan-twitter-@RepMikeGarcia-filtered.txt-shallow-20200710-162713-co7gw-00000.warc.os.cdx.gz 18073 download
urls-archive.max.fan-twitter-@RepMikeGarcia-filtered.txt-shallow-20200710-162713-co7gw-meta.warc.gz 13938 download   job
urls-archive.max.fan-twitter-@RepMikeGarcia-filtered.txt-shallow-20200710-162713-co7gw-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepMikeGarcia-filtered.txt-shallow-20200710-162713-co7gw-urls.txt 1830 download
urls-archive.max.fan-twitter-@RepMikeGarcia-filtered.txt-shallow-20200710-162713-co7gw.json 341 download   job
urls-archive.max.fan-twitter-@RepRickAllen-filtered.txt-shallow-20200710-162712-e0mei-00000.warc.gz 306047953 download   job
urls-archive.max.fan-twitter-@RepRickAllen-filtered.txt-shallow-20200710-162712-e0mei-00000.warc.os.cdx.gz 445227 download
urls-archive.max.fan-twitter-@RepRickAllen-filtered.txt-shallow-20200710-162712-e0mei-meta.warc.gz 240260 download   job
urls-archive.max.fan-twitter-@RepRickAllen-filtered.txt-shallow-20200710-162712-e0mei-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepRickAllen-filtered.txt-shallow-20200710-162712-e0mei.json 339 download   job
urls-archive.max.fan-twitter-@RepRiggleman-filtered.txt-shallow-20200710-162711-2h7kx-00000.warc.gz 344877111 download   job
urls-archive.max.fan-twitter-@RepRiggleman-filtered.txt-shallow-20200710-162711-2h7kx-00000.warc.os.cdx.gz 506155 download
urls-archive.max.fan-twitter-@RepRiggleman-filtered.txt-shallow-20200710-162711-2h7kx-meta.warc.gz 274244 download   job
urls-archive.max.fan-twitter-@RepRiggleman-filtered.txt-shallow-20200710-162711-2h7kx-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepRiggleman-filtered.txt-shallow-20200710-162711-2h7kx-urls.txt 93120 download
urls-archive.max.fan-twitter-@RepRiggleman-filtered.txt-shallow-20200710-162711-2h7kx.json 339 download   job
urls-archive.max.fan-twitter-@RepRonWright-filtered.txt-shallow-20200710-162711-5gyda-00000.warc.gz 168801170 download   job
urls-archive.max.fan-twitter-@RepRonWright-filtered.txt-shallow-20200710-162711-5gyda-00000.warc.os.cdx.gz 354284 download
urls-archive.max.fan-twitter-@RepRonWright-filtered.txt-shallow-20200710-162711-5gyda-meta.warc.gz 192444 download   job
urls-archive.max.fan-twitter-@RepRonWright-filtered.txt-shallow-20200710-162711-5gyda-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepRonWright-filtered.txt-shallow-20200710-162711-5gyda-urls.txt 50460 download
urls-archive.max.fan-twitter-@RepRonWright-filtered.txt-shallow-20200710-162711-5gyda.json 339 download   job
urls-archive.max.fan-twitter-@RepRossSpano-filtered.txt-shallow-20200710-162710-710fl-00000.warc.gz 163109892 download   job
urls-archive.max.fan-twitter-@RepRossSpano-filtered.txt-shallow-20200710-162710-710fl-00000.warc.os.cdx.gz 279731 download
urls-archive.max.fan-twitter-@RepRossSpano-filtered.txt-shallow-20200710-162710-710fl-meta.warc.gz 152829 download   job
urls-archive.max.fan-twitter-@RepRossSpano-filtered.txt-shallow-20200710-162710-710fl-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepRossSpano-filtered.txt-shallow-20200710-162710-710fl-urls.txt 42540 download
urls-archive.max.fan-twitter-@RepRussell-filtered.txt-shallow-20200710-161354-8uhhp.json 335 download   job
urls-archive.max.fan-twitter-@RepRutherfordFL-filtered.txt-shallow-20200710-161352-16kt8-00000.warc.gz 191539937 download   job
urls-archive.max.fan-twitter-@RepRutherfordFL-filtered.txt-shallow-20200710-161352-16kt8-00000.warc.os.cdx.gz 418379 download
urls-archive.max.fan-twitter-@RepRutherfordFL-filtered.txt-shallow-20200710-161352-16kt8-urls.txt 70155 download
urls-archive.max.fan-twitter-@RepRutherfordFL-filtered.txt-shallow-20200710-161352-16kt8.json 345 download   job
urls-archive.max.fan-twitter-@RepSwalwell-filtered.txt-shallow-20200710-161351-338pr-00000.warc.gz 1602294491 download   job
urls-archive.max.fan-twitter-@RepSwalwell-filtered.txt-shallow-20200710-161351-338pr-00000.warc.os.cdx.gz 5019031 download
urls-archive.max.fan-twitter-@RepSwalwell-filtered.txt-shallow-20200710-161351-338pr-meta.warc.gz 2594502 download   job
urls-archive.max.fan-twitter-@RepSwalwell-filtered.txt-shallow-20200710-161351-338pr-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepSwalwell-filtered.txt-shallow-20200710-161351-338pr-urls.txt 577525 download
urls-archive.max.fan-twitter-@RepSwalwell-filtered.txt-shallow-20200710-161351-338pr.json 337 download   job
urls-archive.max.fan-twitter-@RepTedLieu-filtered.txt-shallow-20200710-161239-aq2nr-00000.warc.gz 630008927 download   job
urls-archive.max.fan-twitter-@RepTedLieu-filtered.txt-shallow-20200710-161239-aq2nr-00000.warc.os.cdx.gz 1967903 download
urls-archive.max.fan-twitter-@RepTedLieu-filtered.txt-shallow-20200710-161239-aq2nr-urls.txt 205654 download
urls-archive.max.fan-twitter-@RepTedLieu-filtered.txt-shallow-20200710-161239-aq2nr.json 335 download   job
urls-archive.max.fan-twitter-@RepTedYoho-filtered.txt-shallow-20200710-161238-cnymd-00000.warc.gz 305890961 download   job
urls-archive.max.fan-twitter-@RepTedYoho-filtered.txt-shallow-20200710-161238-cnymd-00000.warc.os.cdx.gz 650834 download
urls-archive.max.fan-twitter-@RepTedYoho-filtered.txt-shallow-20200710-161238-cnymd-meta.warc.gz 349778 download   job
urls-archive.max.fan-twitter-@RepTedYoho-filtered.txt-shallow-20200710-161238-cnymd-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepTedYoho-filtered.txt-shallow-20200710-161238-cnymd-urls.txt 87940 download
urls-archive.max.fan-twitter-@RepTedYoho-filtered.txt-shallow-20200710-161238-cnymd.json 335 download   job
urls-archive.max.fan-twitter-@RepTiffany-filtered.txt-shallow-20200710-160753-6x3ap-00000.warc.gz 3878025 download   job
urls-archive.max.fan-twitter-@RepTiffany-filtered.txt-shallow-20200710-160753-6x3ap-00000.warc.os.cdx.gz 13352 download
urls-archive.max.fan-twitter-@RepTiffany-filtered.txt-shallow-20200710-160753-6x3ap-meta.warc.gz 11427 download   job
urls-archive.max.fan-twitter-@RepTiffany-filtered.txt-shallow-20200710-160753-6x3ap-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepTiffany-filtered.txt-shallow-20200710-160753-6x3ap-urls.txt 986 download
urls-archive.max.fan-twitter-@RepTiffany_-filtered.txt-shallow-20200710-160750-25jk8-00000.warc.gz 1456259 download   job
urls-archive.max.fan-twitter-@RepTiffany_-filtered.txt-shallow-20200710-160750-25jk8-00000.warc.os.cdx.gz 4590 download
urls-archive.max.fan-twitter-@RepTiffany_-filtered.txt-shallow-20200710-160750-25jk8-meta.warc.gz 6431 download   job
urls-archive.max.fan-twitter-@RepTiffany_-filtered.txt-shallow-20200710-160750-25jk8-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RepTiffany_-filtered.txt-shallow-20200710-160750-25jk8.json 337 download   job
urls-archive.max.fan-twitter-@ReverendWarnock-filtered.txt-shallow-20200710-160750-231we-00000.warc.gz 35597672 download   job
urls-archive.max.fan-twitter-@ReverendWarnock-filtered.txt-shallow-20200710-160750-231we-00000.warc.os.cdx.gz 135396 download
urls-archive.max.fan-twitter-@ReverendWarnock-filtered.txt-shallow-20200710-160750-231we-meta.warc.gz 76302 download   job
urls-archive.max.fan-twitter-@ReverendWarnock-filtered.txt-shallow-20200710-160750-231we-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@ReverendWarnock-filtered.txt-shallow-20200710-160750-231we-urls.txt 15246 download
urls-archive.max.fan-twitter-@ReverendWarnock-filtered.txt-shallow-20200710-160750-231we.json 345 download   job
urls-archive.max.fan-twitter-@RhodeIslandGOP-filtered.txt-shallow-20200710-160052-59njl-00000.warc.gz 614116227 download   job
urls-archive.max.fan-twitter-@RhodeIslandGOP-filtered.txt-shallow-20200710-160052-59njl-00000.warc.os.cdx.gz 594186 download
urls-archive.max.fan-twitter-@RhodeIslandGOP-filtered.txt-shallow-20200710-160052-59njl-meta.warc.gz 319669 download   job
urls-archive.max.fan-twitter-@RhodeIslandGOP-filtered.txt-shallow-20200710-160052-59njl-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RhodeIslandGOP-filtered.txt-shallow-20200710-160052-59njl-urls.txt 408242 download
urls-archive.max.fan-twitter-@RichardFausset-filtered.txt-shallow-20200710-160049-2m0cv-00000.warc.gz 393544997 download   job
urls-archive.max.fan-twitter-@RichardFausset-filtered.txt-shallow-20200710-160049-2m0cv-00000.warc.os.cdx.gz 653277 download
urls-archive.max.fan-twitter-@RichardFausset-filtered.txt-shallow-20200710-160049-2m0cv-meta.warc.gz 348981 download   job
urls-archive.max.fan-twitter-@RichardFausset-filtered.txt-shallow-20200710-160049-2m0cv-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RichardFausset-filtered.txt-shallow-20200710-160049-2m0cv-urls.txt 258238 download
urls-archive.max.fan-twitter-@RichardFausset-filtered.txt-shallow-20200710-160049-2m0cv.json 343 download   job
urls-archive.max.fan-twitter-@RickettsForGov-filtered.txt-shallow-20200710-155603-9zv8m-00000.warc.gz 202142255 download   job
urls-archive.max.fan-twitter-@RickettsForGov-filtered.txt-shallow-20200710-155603-9zv8m-00000.warc.os.cdx.gz 193270 download
urls-archive.max.fan-twitter-@RickettsForGov-filtered.txt-shallow-20200710-155603-9zv8m-meta.warc.gz 107706 download   job
urls-archive.max.fan-twitter-@RickettsForGov-filtered.txt-shallow-20200710-155603-9zv8m-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RickettsForGov-filtered.txt-shallow-20200710-155603-9zv8m-urls.txt 75579 download
urls-archive.max.fan-twitter-@RickettsForGov-filtered.txt-shallow-20200710-155603-9zv8m.json 343 download   job
urls-archive.max.fan-twitter-@RioPavilion-filtered.txt-shallow-20200710-155601-7ons4-00000.warc.gz 153459854 download   job
urls-archive.max.fan-twitter-@RioPavilion-filtered.txt-shallow-20200710-155601-7ons4-00000.warc.os.cdx.gz 155934 download
urls-archive.max.fan-twitter-@RioPavilion-filtered.txt-shallow-20200710-155601-7ons4-meta.warc.gz 88199 download   job
urls-archive.max.fan-twitter-@RioPavilion-filtered.txt-shallow-20200710-155601-7ons4-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RioPavilion-filtered.txt-shallow-20200710-155601-7ons4-urls.txt 66949 download
urls-archive.max.fan-twitter-@RioPavilion-filtered.txt-shallow-20200710-155601-7ons4.json 337 download   job
urls-archive.max.fan-twitter-@RorySmith-filtered.txt-shallow-20200710-153938-bfjjy-00000.warc.gz 3583898143 download   job
urls-archive.max.fan-twitter-@RorySmith-filtered.txt-shallow-20200710-153938-bfjjy-00000.warc.os.cdx.gz 7285919 download
urls-archive.max.fan-twitter-@RorySmith-filtered.txt-shallow-20200710-153938-bfjjy-meta.warc.gz 3819932 download   job
urls-archive.max.fan-twitter-@RorySmith-filtered.txt-shallow-20200710-153938-bfjjy-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RorySmith-filtered.txt-shallow-20200710-153938-bfjjy-urls.txt 2719185 download
urls-archive.max.fan-twitter-@RorySmith-filtered.txt-shallow-20200710-153938-bfjjy.json 333 download   job
urls-archive.max.fan-twitter-@RussContreras-filtered.txt-shallow-20200710-145606-aby5g-00000.warc.gz 2670169441 download   job
urls-archive.max.fan-twitter-@RussContreras-filtered.txt-shallow-20200710-145606-aby5g-00000.warc.os.cdx.gz 3362898 download
urls-archive.max.fan-twitter-@RussContreras-filtered.txt-shallow-20200710-145606-aby5g-meta.warc.gz 1762152 download   job
urls-archive.max.fan-twitter-@RussContreras-filtered.txt-shallow-20200710-145606-aby5g-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@RussContreras-filtered.txt-shallow-20200710-145606-aby5g-urls.txt 1917152 download
urls-archive.max.fan-twitter-@RussContreras-filtered.txt-shallow-20200710-145606-aby5g.json 341 download   job
urls-archive.max.fan-twitter-@RussiaUN-filtered.txt-shallow-20200710-145603-d8me9-00000.warc.gz 1454579194 download   job
urls-archive.max.fan-twitter-@RussiaUN-filtered.txt-shallow-20200710-145603-d8me9-00000.warc.os.cdx.gz 2288179 download
urls-archive.max.fan-twitter-@RussiaUN-filtered.txt-shallow-20200710-145603-d8me9.json 331 download   job
urls-archive.max.fan-twitter-@SCT_mx-filtered.txt-shallow-20200710-131052-6bzgb-00000.warc.gz 5368718760 download   job
urls-archive.max.fan-twitter-@SCT_mx-filtered.txt-shallow-20200710-131052-6bzgb-00000.warc.os.cdx.gz 7326445 download
urls-archive.max.fan-twitter-@SCT_mx-filtered.txt-shallow-20200710-131052-6bzgb-meta.warc.gz 4944300 download   job
urls-archive.max.fan-twitter-@SCT_mx-filtered.txt-shallow-20200710-131052-6bzgb-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@SEDENAmx-filtered.txt-shallow-20200710-115757-5nx7q-00001.warc.gz 1305215912 download   job
urls-archive.max.fan-twitter-@SEDENAmx-filtered.txt-shallow-20200710-115757-5nx7q-00001.warc.os.cdx.gz 1460744 download
urls-archive.max.fan-twitter-@SEDENAmx-filtered.txt-shallow-20200710-115757-5nx7q-urls.txt 1502971 download
urls-archive.max.fan-twitter-@SEDENAmx-filtered.txt-shallow-20200710-115757-5nx7q.json 331 download   job
urls-archive.max.fan-twitter-@SEGOB_mx-filtered.txt-shallow-20200710-114640-5e1r9-00000.warc.gz 5368827645 download   job
urls-archive.max.fan-twitter-@SEGOB_mx-filtered.txt-shallow-20200710-114640-5e1r9-00000.warc.os.cdx.gz 6923615 download
urls-archive.max.fan-twitter-@SEGOB_mx-filtered.txt-shallow-20200710-114640-5e1r9-00001.warc.gz 5369343007 download   job
urls-archive.max.fan-twitter-@SEGOB_mx-filtered.txt-shallow-20200710-114640-5e1r9-00001.warc.os.cdx.gz 2882560 download
urls-archive.max.fan-twitter-@SEGOB_mx-filtered.txt-shallow-20200710-114640-5e1r9-00002.warc.gz 3594984305 download   job
urls-archive.max.fan-twitter-@SEGOB_mx-filtered.txt-shallow-20200710-114640-5e1r9-00002.warc.os.cdx.gz 3515459 download
urls-archive.max.fan-twitter-@SEGOB_mx-filtered.txt-shallow-20200710-114640-5e1r9-meta.warc.gz 7012083 download   job
urls-archive.max.fan-twitter-@SEGOB_mx-filtered.txt-shallow-20200710-114640-5e1r9-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@SEGOB_mx-filtered.txt-shallow-20200710-114640-5e1r9-urls.txt 3225890 download
urls-archive.max.fan-twitter-@SEGOB_mx-filtered.txt-shallow-20200710-114640-5e1r9.json 331 download   job
urls-archive.max.fan-twitter-@SethAbramson-filtered.txt-shallow-20200710-094942-581qp-00001.warc.gz 2087371461 download   job
urls-archive.max.fan-twitter-@SethAbramson-filtered.txt-shallow-20200710-094942-581qp-00001.warc.os.cdx.gz 8721999 download
urls-archive.max.fan-twitter-@SethAbramson-filtered.txt-shallow-20200710-094942-581qp-meta.warc.gz 9708421 download   job
urls-archive.max.fan-twitter-@SethAbramson-filtered.txt-shallow-20200710-094942-581qp-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@SethAbramson-filtered.txt-shallow-20200710-094942-581qp-urls.txt 3651758 download
urls-archive.max.fan-twitter-@SethAbramson-filtered.txt-shallow-20200710-094942-581qp.json 339 download   job
urls-archive.max.fan-twitter-@pauljweber-filtered.txt-shallow-20200710-192751-c9w7v-urls.txt 6219 download
urls-archive.max.fan-twitter-@pauljweber-filtered.txt-shallow-20200710-192751-c9w7v.json 335 download   job
urls-archive.max.fan-twitter-@ph_desfosses-filtered.txt-shallow-20200710-183718-3si69-00000.warc.gz 133613311 download   job
urls-archive.max.fan-twitter-@ph_desfosses-filtered.txt-shallow-20200710-183718-3si69-00000.warc.os.cdx.gz 169074 download
urls-archive.max.fan-twitter-@ph_desfosses-filtered.txt-shallow-20200710-183718-3si69-meta.warc.gz 95602 download   job
urls-archive.max.fan-twitter-@ph_desfosses-filtered.txt-shallow-20200710-183718-3si69-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@ph_desfosses-filtered.txt-shallow-20200710-183718-3si69-urls.txt 61431 download
urls-archive.max.fan-twitter-@ph_desfosses-filtered.txt-shallow-20200710-183718-3si69.json 339 download   job
urls-archive.max.fan-twitter-@photojscho-filtered.txt-shallow-20200710-183256-1kmbf-00000.warc.gz 7158717 download   job
urls-archive.max.fan-twitter-@photojscho-filtered.txt-shallow-20200710-183256-1kmbf-00000.warc.os.cdx.gz 12567 download
urls-archive.max.fan-twitter-@photojscho-filtered.txt-shallow-20200710-183256-1kmbf-meta.warc.gz 11120 download   job
urls-archive.max.fan-twitter-@photojscho-filtered.txt-shallow-20200710-183256-1kmbf-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@photojscho-filtered.txt-shallow-20200710-183256-1kmbf-urls.txt 5080 download
urls-archive.max.fan-twitter-@photojscho-filtered.txt-shallow-20200710-183256-1kmbf.json 335 download   job
urls-archive.max.fan-twitter-@pololikashvili-filtered.txt-shallow-20200710-182708-21z8s-00000.warc.gz 114872442 download   job
urls-archive.max.fan-twitter-@pololikashvili-filtered.txt-shallow-20200710-182708-21z8s-00000.warc.os.cdx.gz 193076 download
urls-archive.max.fan-twitter-@pololikashvili-filtered.txt-shallow-20200710-182708-21z8s-meta.warc.gz 107152 download   job
urls-archive.max.fan-twitter-@pololikashvili-filtered.txt-shallow-20200710-182708-21z8s-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@pololikashvili-filtered.txt-shallow-20200710-182708-21z8s-urls.txt 28970 download
urls-archive.max.fan-twitter-@pololikashvili-filtered.txt-shallow-20200710-182708-21z8s.json 343 download   job
urls-archive.max.fan-twitter-@porterthereport-filtered.txt-shallow-20200710-182707-8d6fi-00000.warc.gz 489086023 download   job
urls-archive.max.fan-twitter-@porterthereport-filtered.txt-shallow-20200710-182707-8d6fi-00000.warc.os.cdx.gz 862561 download
urls-archive.max.fan-twitter-@porterthereport-filtered.txt-shallow-20200710-182707-8d6fi-meta.warc.gz 458589 download   job
urls-archive.max.fan-twitter-@porterthereport-filtered.txt-shallow-20200710-182707-8d6fi-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@porterthereport-filtered.txt-shallow-20200710-182707-8d6fi-urls.txt 415472 download
urls-archive.max.fan-twitter-@porterthereport-filtered.txt-shallow-20200710-182707-8d6fi.json 345 download   job
urls-archive.max.fan-twitter-@princetongerry-filtered.txt-shallow-20200710-174453-1ulpk-00000.warc.gz 19494250 download   job
urls-archive.max.fan-twitter-@princetongerry-filtered.txt-shallow-20200710-174453-1ulpk-00000.warc.os.cdx.gz 37988 download
urls-archive.max.fan-twitter-@princetongerry-filtered.txt-shallow-20200710-174453-1ulpk-meta.warc.gz 24758 download   job
urls-archive.max.fan-twitter-@princetongerry-filtered.txt-shallow-20200710-174453-1ulpk-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@princetongerry-filtered.txt-shallow-20200710-174453-1ulpk-urls.txt 9238 download
urls-archive.max.fan-twitter-@princetongerry-filtered.txt-shallow-20200710-174453-1ulpk.json 343 download   job
urls-archive.max.fan-twitter-@profvrr-filtered.txt-shallow-20200710-174041-16mn9-00000.warc.gz 724228115 download   job
urls-archive.max.fan-twitter-@profvrr-filtered.txt-shallow-20200710-174041-16mn9-00000.warc.os.cdx.gz 1001569 download
urls-archive.max.fan-twitter-@profvrr-filtered.txt-shallow-20200710-174041-16mn9-meta.warc.gz 537285 download   job
urls-archive.max.fan-twitter-@profvrr-filtered.txt-shallow-20200710-174041-16mn9-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@profvrr-filtered.txt-shallow-20200710-174041-16mn9-urls.txt 407381 download
urls-archive.max.fan-twitter-@profvrr-filtered.txt-shallow-20200710-174041-16mn9.json 329 download   job
urls-archive.max.fan-twitter-@rachel_dry-filtered.txt-shallow-20200710-173526-d9xj9-00000.warc.gz 70391882 download   job
urls-archive.max.fan-twitter-@rachel_dry-filtered.txt-shallow-20200710-173526-d9xj9-00000.warc.os.cdx.gz 158664 download
urls-archive.max.fan-twitter-@rachel_dry-filtered.txt-shallow-20200710-173526-d9xj9-meta.warc.gz 89124 download   job
urls-archive.max.fan-twitter-@rachel_dry-filtered.txt-shallow-20200710-173526-d9xj9-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@rachel_dry-filtered.txt-shallow-20200710-173526-d9xj9-urls.txt 57338 download
urls-archive.max.fan-twitter-@rachel_dry-filtered.txt-shallow-20200710-173526-d9xj9.json 335 download   job
urls-archive.max.fan-twitter-@ray_slowbeat-filtered.txt-shallow-20200710-172406-b0neq-00000.warc.gz 327706505 download   job
urls-archive.max.fan-twitter-@ray_slowbeat-filtered.txt-shallow-20200710-172406-b0neq-00000.warc.os.cdx.gz 581078 download
urls-archive.max.fan-twitter-@ray_slowbeat-filtered.txt-shallow-20200710-172406-b0neq-meta.warc.gz 306558 download   job
urls-archive.max.fan-twitter-@ray_slowbeat-filtered.txt-shallow-20200710-172406-b0neq-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@ray_slowbeat-filtered.txt-shallow-20200710-172406-b0neq-urls.txt 104488 download
urls-archive.max.fan-twitter-@ray_slowbeat-filtered.txt-shallow-20200710-172406-b0neq.json 339 download   job
urls-archive.max.fan-twitter-@rbfallstromAP-filtered.txt-shallow-20200710-172405-6mow3-00000.warc.gz 297904365 download   job
urls-archive.max.fan-twitter-@rbfallstromAP-filtered.txt-shallow-20200710-172405-6mow3-00000.warc.os.cdx.gz 323911 download
urls-archive.max.fan-twitter-@rbfallstromAP-filtered.txt-shallow-20200710-172405-6mow3-meta.warc.gz 174366 download   job
urls-archive.max.fan-twitter-@rbfallstromAP-filtered.txt-shallow-20200710-172405-6mow3-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@rbfallstromAP-filtered.txt-shallow-20200710-172405-6mow3-urls.txt 292926 download
urls-archive.max.fan-twitter-@rbfallstromAP-filtered.txt-shallow-20200710-172405-6mow3.json 341 download   job
urls-archive.max.fan-twitter-@rcfp-filtered.txt-shallow-20200710-172257-a9uwl-00000.warc.gz 2837801 download   job
urls-archive.max.fan-twitter-@rcfp-filtered.txt-shallow-20200710-172257-a9uwl-00000.warc.os.cdx.gz 13100 download
urls-archive.max.fan-twitter-@rcfp-filtered.txt-shallow-20200710-172257-a9uwl-meta.warc.gz 11387 download   job
urls-archive.max.fan-twitter-@rcfp-filtered.txt-shallow-20200710-172257-a9uwl-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@rcfp-filtered.txt-shallow-20200710-172257-a9uwl-urls.txt 726 download
urls-archive.max.fan-twitter-@rcfp-filtered.txt-shallow-20200710-172257-a9uwl.json 323 download   job
urls-archive.max.fan-twitter-@rcjonesphoto-filtered.txt-shallow-20200710-172254-d8unz-00000.warc.gz 384859954 download   job
urls-archive.max.fan-twitter-@rcjonesphoto-filtered.txt-shallow-20200710-172254-d8unz-00000.warc.os.cdx.gz 398144 download
urls-archive.max.fan-twitter-@rcjonesphoto-filtered.txt-shallow-20200710-172254-d8unz-meta.warc.gz 213316 download   job
urls-archive.max.fan-twitter-@rcjonesphoto-filtered.txt-shallow-20200710-172254-d8unz-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@rcjonesphoto-filtered.txt-shallow-20200710-172254-d8unz-urls.txt 332768 download
urls-archive.max.fan-twitter-@rcjonesphoto-filtered.txt-shallow-20200710-172254-d8unz.json 339 download   job
urls-archive.max.fan-twitter-@readercenter-filtered.txt-shallow-20200710-171550-8fhfo-00000.warc.gz 211190649 download   job
urls-archive.max.fan-twitter-@readercenter-filtered.txt-shallow-20200710-171550-8fhfo-00000.warc.os.cdx.gz 497068 download
urls-archive.max.fan-twitter-@readercenter-filtered.txt-shallow-20200710-171550-8fhfo-meta.warc.gz 263395 download   job
urls-archive.max.fan-twitter-@readercenter-filtered.txt-shallow-20200710-171550-8fhfo-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@readercenter-filtered.txt-shallow-20200710-171550-8fhfo-urls.txt 165815 download
urls-archive.max.fan-twitter-@readercenter-filtered.txt-shallow-20200710-171550-8fhfo.json 339 download   job
urls-archive.max.fan-twitter-@realrichardmay-filtered.txt-shallow-20200710-171251-8hik0-00000.warc.gz 723452423 download   job
urls-archive.max.fan-twitter-@realrichardmay-filtered.txt-shallow-20200710-171251-8hik0-00000.warc.os.cdx.gz 646468 download
urls-archive.max.fan-twitter-@realrichardmay-filtered.txt-shallow-20200710-171251-8hik0-meta.warc.gz 331807 download   job
urls-archive.max.fan-twitter-@realrichardmay-filtered.txt-shallow-20200710-171251-8hik0-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@realrichardmay-filtered.txt-shallow-20200710-171251-8hik0-urls.txt 745243 download
urls-archive.max.fan-twitter-@realrichardmay-filtered.txt-shallow-20200710-171251-8hik0.json 343 download   job
urls-archive.max.fan-twitter-@redditchrachel-filtered.txt-shallow-20200710-170952-4wjux-00000.warc.gz 749124040 download   job
urls-archive.max.fan-twitter-@redditchrachel-filtered.txt-shallow-20200710-170952-4wjux-00000.warc.os.cdx.gz 1043635 download
urls-archive.max.fan-twitter-@redditchrachel-filtered.txt-shallow-20200710-170952-4wjux-meta.warc.gz 555958 download   job
urls-archive.max.fan-twitter-@redditchrachel-filtered.txt-shallow-20200710-170952-4wjux-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@redditchrachel-filtered.txt-shallow-20200710-170952-4wjux-urls.txt 274523 download
urls-archive.max.fan-twitter-@redditchrachel-filtered.txt-shallow-20200710-170952-4wjux.json 343 download   job
urls-archive.max.fan-twitter-@refugee_gender-filtered.txt-shallow-20200710-170916-bb8wk-00000.warc.gz 95187207 download   job
urls-archive.max.fan-twitter-@refugee_gender-filtered.txt-shallow-20200710-170916-bb8wk-00000.warc.os.cdx.gz 239140 download
urls-archive.max.fan-twitter-@refugee_gender-filtered.txt-shallow-20200710-170916-bb8wk-meta.warc.gz 131486 download   job
urls-archive.max.fan-twitter-@refugee_gender-filtered.txt-shallow-20200710-170916-bb8wk-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@refugee_gender-filtered.txt-shallow-20200710-170916-bb8wk-urls.txt 53029 download
urls-archive.max.fan-twitter-@refugee_gender-filtered.txt-shallow-20200710-170916-bb8wk.json 343 download   job
urls-archive.max.fan-twitter-@relucasz-filtered.txt-shallow-20200710-170623-amxo7-00000.warc.gz 238289462 download   job
urls-archive.max.fan-twitter-@relucasz-filtered.txt-shallow-20200710-170623-amxo7-00000.warc.os.cdx.gz 561819 download
urls-archive.max.fan-twitter-@relucasz-filtered.txt-shallow-20200710-170623-amxo7-meta.warc.gz 300592 download   job
urls-archive.max.fan-twitter-@relucasz-filtered.txt-shallow-20200710-170623-amxo7-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@relucasz-filtered.txt-shallow-20200710-170623-amxo7-urls.txt 162368 download
urls-archive.max.fan-twitter-@relucasz-filtered.txt-shallow-20200710-170623-amxo7.json 331 download   job
urls-archive.max.fan-twitter-@renato_mariotti-filtered.txt-shallow-20200710-170623-a94mb-urls.txt 1393434 download
urls-archive.max.fan-twitter-@reynadesai-filtered.txt-shallow-20200710-160715-4wkef-00000.warc.gz 382397109 download   job
urls-archive.max.fan-twitter-@reynadesai-filtered.txt-shallow-20200710-160715-4wkef-00000.warc.os.cdx.gz 369972 download
urls-archive.max.fan-twitter-@reynadesai-filtered.txt-shallow-20200710-160715-4wkef-meta.warc.gz 200015 download   job
urls-archive.max.fan-twitter-@reynadesai-filtered.txt-shallow-20200710-160715-4wkef-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@reynadesai-filtered.txt-shallow-20200710-160715-4wkef.json 335 download   job
urls-archive.max.fan-twitter-@rfremson-filtered.txt-shallow-20200710-160311-5rxhq-00000.warc.gz 64913228 download   job
urls-archive.max.fan-twitter-@rfremson-filtered.txt-shallow-20200710-160311-5rxhq-00000.warc.os.cdx.gz 96364 download
urls-archive.max.fan-twitter-@rfremson-filtered.txt-shallow-20200710-160311-5rxhq-meta.warc.gz 56066 download   job
urls-archive.max.fan-twitter-@rfremson-filtered.txt-shallow-20200710-160311-5rxhq-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@rfremson-filtered.txt-shallow-20200710-160311-5rxhq-urls.txt 22048 download
urls-archive.max.fan-twitter-@rfremson-filtered.txt-shallow-20200710-160311-5rxhq.json 331 download   job
urls-archive.max.fan-twitter-@robportman-filtered.txt-shallow-20200710-155007-4ihoq-00000.warc.gz 716163263 download   job
urls-archive.max.fan-twitter-@robportman-filtered.txt-shallow-20200710-155007-4ihoq-00000.warc.os.cdx.gz 990302 download
urls-archive.max.fan-twitter-@robportman-filtered.txt-shallow-20200710-155007-4ihoq-meta.warc.gz 522583 download   job
urls-archive.max.fan-twitter-@robportman-filtered.txt-shallow-20200710-155007-4ihoq-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@robportman-filtered.txt-shallow-20200710-155007-4ihoq-urls.txt 372165 download
urls-archive.max.fan-twitter-@robportman-filtered.txt-shallow-20200710-155007-4ihoq.json 335 download   job
urls-archive.max.fan-twitter-@robreiner-filtered.txt-shallow-20200710-154153-1w9h8-meta.warc.gz 906006 download   job
urls-archive.max.fan-twitter-@robreiner-filtered.txt-shallow-20200710-154153-1w9h8-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@robreiner-filtered.txt-shallow-20200710-154153-1w9h8-urls.txt 88951 download
urls-archive.max.fan-twitter-@rocionahle-filtered.txt-shallow-20200710-154153-bkrnf-meta.warc.gz 834213 download   job
urls-archive.max.fan-twitter-@rocionahle-filtered.txt-shallow-20200710-154153-bkrnf-meta.warc.os.cdx.gz 47 download
urls-archive.max.fan-twitter-@rocionahle-filtered.txt-shallow-20200710-154153-bkrnf-urls.txt 237917 download
urls-archive.max.fan-twitter-@rocionahle-filtered.txt-shallow-20200710-154153-bkrnf.json 335 download   job
urls-transfer.notkiska.pw-facebook-@EqualityForFlatbush-shallow-20200710-131353-8fl7e-00002.warc.gz 5434525729 download   job
urls-transfer.notkiska.pw-facebook-@EqualityForFlatbush-shallow-20200710-131353-8fl7e-00002.warc.os.cdx.gz 611107 download
urls-transfer.notkiska.pw-twitter-%23notmypresident-shallow-20200530-220957-2c0z0-00102.warc.gz 5369131423 download   job
urls-transfer.notkiska.pw-twitter-%23notmypresident-shallow-20200530-220957-2c0z0-00102.warc.os.cdx.gz 1508279 download
urls-transfer.notkiska.pw-twitter-%23schoolsreopening-shallow-20200709-165902-2kyn5-00017.warc.gz 5375682728 download   job
urls-transfer.notkiska.pw-twitter-%23schoolsreopening-shallow-20200709-165902-2kyn5-00017.warc.os.cdx.gz 3072875 download
urls-transfer.notkiska.pw-twitter-@EqualFlatbush-shallow-20200710-130411-a3k90-meta.warc.gz 2136042 download   job
urls-transfer.notkiska.pw-twitter-@EqualFlatbush-shallow-20200710-130411-a3k90-meta.warc.os.cdx.gz 47 download
urls-transfer.notkiska.pw-twitter-@EqualFlatbush-shallow-20200710-130411-a3k90-urls.txt 757922 download
urls-transfer.notkiska.pw-twitter-@EqualFlatbush-shallow-20200710-130411-a3k90.json 340 download   job
urls-transfer.notkiska.pw-vote-usa_org-twitter-accounts-outlinks.1.txt-shallow-20200609-230435-7k4tj-00068.warc.gz 5373481964 download   job
urls-transfer.notkiska.pw-vote-usa_org-twitter-accounts-outlinks.1.txt-shallow-20200609-230435-7k4tj-00068.warc.os.cdx.gz 4972933 download
www.raspberrypi.org-inf-20200707-192424-bv6p7-00022.warc.gz 5368760437 download   job
www.raspberrypi.org-inf-20200707-192424-bv6p7-00022.warc.os.cdx.gz 2833646 download
www.seniorsnews.com.au-inf-20200528-062104-cuuvc-00106.warc.gz 5368743916 download   job
www.seniorsnews.com.au-inf-20200528-062104-cuuvc-00106.warc.os.cdx.gz 3383148 download
xuexi.12371.cn-inf-20200710-180859-4y33p-00000.warc.gz 4478610 download   job
xuexi.12371.cn-inf-20200710-180859-4y33p-00000.warc.os.cdx.gz 11611 download
xuexi.12371.cn-inf-20200710-180859-4y33p-meta.warc.gz 10460 download   job
xuexi.12371.cn-inf-20200710-180859-4y33p-meta.warc.os.cdx.gz 47 download
xuexi.12371.cn-inf-20200710-180859-4y33p.json 243 download   job