Item archiveteam_archivebot_go_20200711030003
Filename | Size | |
---|---|---|
archiveteam_archivebot_go_20200711030003.cdx.gz | 111182464 | download |
archiveteam_archivebot_go_20200711030003.cdx.idx | 100922 | download |
archiveteam_archivebot_go_20200711030003_files.xml | 0 | download |
archiveteam_archivebot_go_20200711030003_meta.sqlite | 705536 | download |
archiveteam_archivebot_go_20200711030003_meta.xml | 969 | download |
arcteryxkorea.tistory.com-inf-20200711-014046-2gwoc-00000.warc.gz | 15038594 | download job |
arcteryxkorea.tistory.com-inf-20200711-014046-2gwoc-00000.warc.os.cdx.gz | 16953 | download |
arcteryxkorea.tistory.com-inf-20200711-014046-2gwoc-meta.warc.gz | 15695 | download job |
arcteryxkorea.tistory.com-inf-20200711-014046-2gwoc-meta.warc.os.cdx.gz | 47 | download |
arcteryxkorea.tistory.com-inf-20200711-014046-2gwoc.json | 259 | download job |
bestgreen.tistory.com-inf-20200711-014136-3cop8-00000.warc.gz | 517351489 | download job |
bestgreen.tistory.com-inf-20200711-014136-3cop8-00000.warc.os.cdx.gz | 319764 | download |
bestgreen.tistory.com-inf-20200711-014137-culn9-meta.warc.gz | 171029 | download job |
bestgreen.tistory.com-inf-20200711-014137-culn9-meta.warc.os.cdx.gz | 47 | download |
detailog.tistory.com-inf-20200711-021238-f40xd-meta.warc.gz | 71984 | download job |
detailog.tistory.com-inf-20200711-021238-f40xd-meta.warc.os.cdx.gz | 47 | download |
dwlm.12371.cn-inf-20200710-212026-12ty6-00000.warc.gz | 5546848997 | download job |
dwlm.12371.cn-inf-20200710-212026-12ty6-00000.warc.os.cdx.gz | 1348413 | download |
dwlm.12371.cn-inf-20200710-212026-12ty6-00001.warc.gz | 2464 | download job |
dwlm.12371.cn-inf-20200710-212026-12ty6-00001.warc.os.cdx.gz | 47 | download |
dwlm.12371.cn-inf-20200710-212026-12ty6-meta.warc.gz | 763877 | download job |
dwlm.12371.cn-inf-20200710-212026-12ty6-meta.warc.os.cdx.gz | 47 | download |
dwlm.12371.cn-inf-20200710-212026-12ty6.json | 242 | download job |
eggnara.tistory.com-inf-20200711-014314-69mu4-00000.warc.gz | 24271514 | download job |
eggnara.tistory.com-inf-20200711-014314-69mu4-00000.warc.os.cdx.gz | 97258 | download |
getsatisfaction.com-inf-20200708-234031-epnla-00010.warc.gz | 5368745802 | download job |
getsatisfaction.com-inf-20200708-234031-epnla-00010.warc.os.cdx.gz | 6957738 | download |
magen.whu.edu.cn-inf-20200626-142701-6m81j-00044.warc.gz | 5640356051 | download job |
magen.whu.edu.cn-inf-20200626-142701-6m81j-00044.warc.os.cdx.gz | 1369 | download |
magen.whu.edu.cn-inf-20200626-142701-6m81j-00045.warc.gz | 5496851174 | download job |
magen.whu.edu.cn-inf-20200626-142701-6m81j-00045.warc.os.cdx.gz | 1438 | download |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00083.warc.gz | 5373094612 | download job |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00083.warc.os.cdx.gz | 73793 | download |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00084.warc.gz | 5415140659 | download job |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00084.warc.os.cdx.gz | 105355 | download |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00085.warc.gz | 5390276229 | download job |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00085.warc.os.cdx.gz | 14087 | download |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00086.warc.gz | 5374594840 | download job |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00086.warc.os.cdx.gz | 17483 | download |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00087.warc.gz | 5934821461 | download job |
mediaset.sdasofia.org-inf-20200709-091713-c8wet-00087.warc.os.cdx.gz | 10586 | download |
new.12377.cn-inf-20200710-201841-4uz15-00000.warc.gz | 5369863667 | download job |
new.12377.cn-inf-20200710-201841-4uz15-00000.warc.os.cdx.gz | 3284951 | download |
rideup.tistory.com-inf-20200711-001006-5beu9.json | 243 | download job |
soony.tistory.com-inf-20200711-000928-dt5kj-00000.warc.gz | 997776622 | download job |
soony.tistory.com-inf-20200711-000928-dt5kj-00000.warc.os.cdx.gz | 672741 | download |
soony.tistory.com-inf-20200711-000928-dt5kj-meta.warc.gz | 421855 | download job |
soony.tistory.com-inf-20200711-000928-dt5kj-meta.warc.os.cdx.gz | 47 | download |
soony.tistory.com-inf-20200711-000928-dt5kj.json | 242 | download job |
storywhy.tistory.com-inf-20200711-005446-cc0cy-00000.warc.gz | 127953690 | download job |
storywhy.tistory.com-inf-20200711-005446-cc0cy-00000.warc.os.cdx.gz | 264199 | download |
storywhy.tistory.com-inf-20200711-005446-cc0cy-meta.warc.gz | 165577 | download job |
storywhy.tistory.com-inf-20200711-005446-cc0cy-meta.warc.os.cdx.gz | 47 | download |
storywhy.tistory.com-inf-20200711-005446-cc0cy.json | 245 | download job |
urls-archive.max.fan-twitter-@NYPD46Pct-filtered.txt-shallow-20200711-004954-89iu2-00000.warc.gz | 616840323 | download job |
urls-archive.max.fan-twitter-@NYPD46Pct-filtered.txt-shallow-20200711-004954-89iu2-00000.warc.os.cdx.gz | 546326 | download |
urls-archive.max.fan-twitter-@NYPD46Pct-filtered.txt-shallow-20200711-004954-89iu2-meta.warc.gz | 291742 | download job |
urls-archive.max.fan-twitter-@NYPD46Pct-filtered.txt-shallow-20200711-004954-89iu2-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD46Pct-filtered.txt-shallow-20200711-004954-89iu2-urls.txt | 113389 | download |
urls-archive.max.fan-twitter-@NYPD46Pct-filtered.txt-shallow-20200711-004954-89iu2.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD47Pct-filtered.txt-shallow-20200711-004952-6t888-00000.warc.gz | 423748444 | download job |
urls-archive.max.fan-twitter-@NYPD47Pct-filtered.txt-shallow-20200711-004952-6t888-00000.warc.os.cdx.gz | 376087 | download |
urls-archive.max.fan-twitter-@NYPD47Pct-filtered.txt-shallow-20200711-004952-6t888-meta.warc.gz | 201353 | download job |
urls-archive.max.fan-twitter-@NYPD47Pct-filtered.txt-shallow-20200711-004952-6t888-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD47Pct-filtered.txt-shallow-20200711-004952-6t888-urls.txt | 97015 | download |
urls-archive.max.fan-twitter-@NYPD47Pct-filtered.txt-shallow-20200711-004952-6t888.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD48Pct-filtered.txt-shallow-20200711-004950-d9pj3-00000.warc.gz | 477941872 | download job |
urls-archive.max.fan-twitter-@NYPD48Pct-filtered.txt-shallow-20200711-004950-d9pj3-00000.warc.os.cdx.gz | 460234 | download |
urls-archive.max.fan-twitter-@NYPD48Pct-filtered.txt-shallow-20200711-004950-d9pj3-meta.warc.gz | 245575 | download job |
urls-archive.max.fan-twitter-@NYPD48Pct-filtered.txt-shallow-20200711-004950-d9pj3-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD48Pct-filtered.txt-shallow-20200711-004950-d9pj3-urls.txt | 106433 | download |
urls-archive.max.fan-twitter-@NYPD48Pct-filtered.txt-shallow-20200711-004950-d9pj3.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD49Pct-filtered.txt-shallow-20200711-004705-2mw33-00000.warc.gz | 627358116 | download job |
urls-archive.max.fan-twitter-@NYPD49Pct-filtered.txt-shallow-20200711-004705-2mw33-00000.warc.os.cdx.gz | 560473 | download |
urls-archive.max.fan-twitter-@NYPD49Pct-filtered.txt-shallow-20200711-004705-2mw33-meta.warc.gz | 297732 | download job |
urls-archive.max.fan-twitter-@NYPD49Pct-filtered.txt-shallow-20200711-004705-2mw33-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD49Pct-filtered.txt-shallow-20200711-004705-2mw33-urls.txt | 137899 | download |
urls-archive.max.fan-twitter-@NYPD49Pct-filtered.txt-shallow-20200711-004705-2mw33.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD50Pct-filtered.txt-shallow-20200711-004705-75son-00000.warc.gz | 318597509 | download job |
urls-archive.max.fan-twitter-@NYPD50Pct-filtered.txt-shallow-20200711-004705-75son-00000.warc.os.cdx.gz | 291025 | download |
urls-archive.max.fan-twitter-@NYPD50Pct-filtered.txt-shallow-20200711-004705-75son-meta.warc.gz | 157878 | download job |
urls-archive.max.fan-twitter-@NYPD50Pct-filtered.txt-shallow-20200711-004705-75son-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD50Pct-filtered.txt-shallow-20200711-004705-75son-urls.txt | 67535 | download |
urls-archive.max.fan-twitter-@NYPD50Pct-filtered.txt-shallow-20200711-004705-75son.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD52Pct-filtered.txt-shallow-20200711-004127-114je-00000.warc.gz | 805562292 | download job |
urls-archive.max.fan-twitter-@NYPD52Pct-filtered.txt-shallow-20200711-004127-114je-00000.warc.os.cdx.gz | 767761 | download |
urls-archive.max.fan-twitter-@NYPD52Pct-filtered.txt-shallow-20200711-004127-114je-meta.warc.gz | 405850 | download job |
urls-archive.max.fan-twitter-@NYPD52Pct-filtered.txt-shallow-20200711-004127-114je-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD52Pct-filtered.txt-shallow-20200711-004127-114je-urls.txt | 213589 | download |
urls-archive.max.fan-twitter-@NYPD52Pct-filtered.txt-shallow-20200711-004127-114je.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD5Pct-filtered.txt-shallow-20200711-004126-cs1jk-00000.warc.gz | 630969261 | download job |
urls-archive.max.fan-twitter-@NYPD5Pct-filtered.txt-shallow-20200711-004126-cs1jk-00000.warc.os.cdx.gz | 450760 | download |
urls-archive.max.fan-twitter-@NYPD5Pct-filtered.txt-shallow-20200711-004126-cs1jk-meta.warc.gz | 240773 | download job |
urls-archive.max.fan-twitter-@NYPD5Pct-filtered.txt-shallow-20200711-004126-cs1jk-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD5Pct-filtered.txt-shallow-20200711-004126-cs1jk-urls.txt | 98670 | download |
urls-archive.max.fan-twitter-@NYPD5Pct-filtered.txt-shallow-20200711-004126-cs1jk.json | 331 | download job |
urls-archive.max.fan-twitter-@NYPD60Pct-filtered.txt-shallow-20200711-004123-csyw3-00000.warc.gz | 491251720 | download job |
urls-archive.max.fan-twitter-@NYPD60Pct-filtered.txt-shallow-20200711-004123-csyw3-00000.warc.os.cdx.gz | 461392 | download |
urls-archive.max.fan-twitter-@NYPD60Pct-filtered.txt-shallow-20200711-004123-csyw3-meta.warc.gz | 246836 | download job |
urls-archive.max.fan-twitter-@NYPD60Pct-filtered.txt-shallow-20200711-004123-csyw3-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD60Pct-filtered.txt-shallow-20200711-004123-csyw3-urls.txt | 119455 | download |
urls-archive.max.fan-twitter-@NYPD60Pct-filtered.txt-shallow-20200711-004123-csyw3.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD61Pct-filtered.txt-shallow-20200711-004054-ai0dg-00000.warc.gz | 560733288 | download job |
urls-archive.max.fan-twitter-@NYPD61Pct-filtered.txt-shallow-20200711-004054-ai0dg-00000.warc.os.cdx.gz | 514148 | download |
urls-archive.max.fan-twitter-@NYPD61Pct-filtered.txt-shallow-20200711-004054-ai0dg-meta.warc.gz | 274968 | download job |
urls-archive.max.fan-twitter-@NYPD61Pct-filtered.txt-shallow-20200711-004054-ai0dg-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD61Pct-filtered.txt-shallow-20200711-004054-ai0dg-urls.txt | 128194 | download |
urls-archive.max.fan-twitter-@NYPD61Pct-filtered.txt-shallow-20200711-004054-ai0dg.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD62Pct-filtered.txt-shallow-20200711-004053-2yc9u-00000.warc.gz | 462505630 | download job |
urls-archive.max.fan-twitter-@NYPD62Pct-filtered.txt-shallow-20200711-004053-2yc9u-00000.warc.os.cdx.gz | 405632 | download |
urls-archive.max.fan-twitter-@NYPD62Pct-filtered.txt-shallow-20200711-004053-2yc9u-meta.warc.gz | 218108 | download job |
urls-archive.max.fan-twitter-@NYPD62Pct-filtered.txt-shallow-20200711-004053-2yc9u-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD62Pct-filtered.txt-shallow-20200711-004053-2yc9u-urls.txt | 92319 | download |
urls-archive.max.fan-twitter-@NYPD62Pct-filtered.txt-shallow-20200711-004053-2yc9u.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD63Pct-filtered.txt-shallow-20200711-004053-7t8kd-00000.warc.gz | 823597865 | download job |
urls-archive.max.fan-twitter-@NYPD63Pct-filtered.txt-shallow-20200711-004053-7t8kd-00000.warc.os.cdx.gz | 711227 | download |
urls-archive.max.fan-twitter-@NYPD63Pct-filtered.txt-shallow-20200711-004053-7t8kd-meta.warc.gz | 377349 | download job |
urls-archive.max.fan-twitter-@NYPD63Pct-filtered.txt-shallow-20200711-004053-7t8kd-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD63Pct-filtered.txt-shallow-20200711-004053-7t8kd-urls.txt | 197664 | download |
urls-archive.max.fan-twitter-@NYPD63Pct-filtered.txt-shallow-20200711-004053-7t8kd.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD66Pct-filtered.txt-shallow-20200711-002323-1h3rg-00000.warc.gz | 651225677 | download job |
urls-archive.max.fan-twitter-@NYPD66Pct-filtered.txt-shallow-20200711-002323-1h3rg-00000.warc.os.cdx.gz | 512491 | download |
urls-archive.max.fan-twitter-@NYPD66Pct-filtered.txt-shallow-20200711-002323-1h3rg-meta.warc.gz | 274865 | download job |
urls-archive.max.fan-twitter-@NYPD66Pct-filtered.txt-shallow-20200711-002323-1h3rg-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD66Pct-filtered.txt-shallow-20200711-002323-1h3rg-urls.txt | 139935 | download |
urls-archive.max.fan-twitter-@NYPD66Pct-filtered.txt-shallow-20200711-002323-1h3rg.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD67Pct-filtered.txt-shallow-20200711-002323-4l7cr-00000.warc.gz | 517116791 | download job |
urls-archive.max.fan-twitter-@NYPD67Pct-filtered.txt-shallow-20200711-002323-4l7cr-00000.warc.os.cdx.gz | 524120 | download |
urls-archive.max.fan-twitter-@NYPD67Pct-filtered.txt-shallow-20200711-002323-4l7cr-meta.warc.gz | 279539 | download job |
urls-archive.max.fan-twitter-@NYPD67Pct-filtered.txt-shallow-20200711-002323-4l7cr-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD67Pct-filtered.txt-shallow-20200711-002323-4l7cr-urls.txt | 114173 | download |
urls-archive.max.fan-twitter-@NYPD67Pct-filtered.txt-shallow-20200711-002323-4l7cr.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD68Pct-filtered.txt-shallow-20200711-002321-e1lh2-00000.warc.gz | 357477002 | download job |
urls-archive.max.fan-twitter-@NYPD68Pct-filtered.txt-shallow-20200711-002321-e1lh2-00000.warc.os.cdx.gz | 376288 | download |
urls-archive.max.fan-twitter-@NYPD68Pct-filtered.txt-shallow-20200711-002321-e1lh2-meta.warc.gz | 204419 | download job |
urls-archive.max.fan-twitter-@NYPD68Pct-filtered.txt-shallow-20200711-002321-e1lh2-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD68Pct-filtered.txt-shallow-20200711-002321-e1lh2-urls.txt | 85451 | download |
urls-archive.max.fan-twitter-@NYPD68Pct-filtered.txt-shallow-20200711-002321-e1lh2.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD69Pct-filtered.txt-shallow-20200711-002136-7och7-00000.warc.gz | 684231716 | download job |
urls-archive.max.fan-twitter-@NYPD69Pct-filtered.txt-shallow-20200711-002136-7och7-00000.warc.os.cdx.gz | 470932 | download |
urls-archive.max.fan-twitter-@NYPD69Pct-filtered.txt-shallow-20200711-002136-7och7-meta.warc.gz | 248214 | download job |
urls-archive.max.fan-twitter-@NYPD69Pct-filtered.txt-shallow-20200711-002136-7och7-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD69Pct-filtered.txt-shallow-20200711-002136-7och7-urls.txt | 107554 | download |
urls-archive.max.fan-twitter-@NYPD69Pct-filtered.txt-shallow-20200711-002136-7och7.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD6Pct-filtered.txt-shallow-20200711-002133-ar5xo-00000.warc.gz | 334722998 | download job |
urls-archive.max.fan-twitter-@NYPD6Pct-filtered.txt-shallow-20200711-002133-ar5xo-00000.warc.os.cdx.gz | 313772 | download |
urls-archive.max.fan-twitter-@NYPD6Pct-filtered.txt-shallow-20200711-002133-ar5xo-meta.warc.gz | 170516 | download job |
urls-archive.max.fan-twitter-@NYPD6Pct-filtered.txt-shallow-20200711-002133-ar5xo-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD6Pct-filtered.txt-shallow-20200711-002133-ar5xo-urls.txt | 67704 | download |
urls-archive.max.fan-twitter-@NYPD6Pct-filtered.txt-shallow-20200711-002133-ar5xo.json | 331 | download job |
urls-archive.max.fan-twitter-@NYPD70Pct-filtered.txt-shallow-20200711-002132-ec646-00000.warc.gz | 412527271 | download job |
urls-archive.max.fan-twitter-@NYPD70Pct-filtered.txt-shallow-20200711-002132-ec646-00000.warc.os.cdx.gz | 374105 | download |
urls-archive.max.fan-twitter-@NYPD70Pct-filtered.txt-shallow-20200711-002132-ec646-meta.warc.gz | 202353 | download job |
urls-archive.max.fan-twitter-@NYPD70Pct-filtered.txt-shallow-20200711-002132-ec646-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD70Pct-filtered.txt-shallow-20200711-002132-ec646-urls.txt | 85018 | download |
urls-archive.max.fan-twitter-@NYPD70Pct-filtered.txt-shallow-20200711-002132-ec646.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD71Pct-filtered.txt-shallow-20200711-002132-42pfg-00000.warc.gz | 459755937 | download job |
urls-archive.max.fan-twitter-@NYPD71Pct-filtered.txt-shallow-20200711-002132-42pfg-00000.warc.os.cdx.gz | 400404 | download |
urls-archive.max.fan-twitter-@NYPD71Pct-filtered.txt-shallow-20200711-002132-42pfg-meta.warc.gz | 214763 | download job |
urls-archive.max.fan-twitter-@NYPD71Pct-filtered.txt-shallow-20200711-002132-42pfg-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD71Pct-filtered.txt-shallow-20200711-002132-42pfg-urls.txt | 106531 | download |
urls-archive.max.fan-twitter-@NYPD71Pct-filtered.txt-shallow-20200711-002132-42pfg.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD72Pct-filtered.txt-shallow-20200711-002131-40nh0-00000.warc.gz | 1316752400 | download job |
urls-archive.max.fan-twitter-@NYPD72Pct-filtered.txt-shallow-20200711-002131-40nh0-00000.warc.os.cdx.gz | 962923 | download |
urls-archive.max.fan-twitter-@NYPD72Pct-filtered.txt-shallow-20200711-002131-40nh0-meta.warc.gz | 503962 | download job |
urls-archive.max.fan-twitter-@NYPD72Pct-filtered.txt-shallow-20200711-002131-40nh0-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD72Pct-filtered.txt-shallow-20200711-002131-40nh0-urls.txt | 234553 | download |
urls-archive.max.fan-twitter-@NYPD72Pct-filtered.txt-shallow-20200711-002131-40nh0.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD73Pct-filtered.txt-shallow-20200711-000458-65uj2-00000.warc.gz | 422864914 | download job |
urls-archive.max.fan-twitter-@NYPD73Pct-filtered.txt-shallow-20200711-000458-65uj2-00000.warc.os.cdx.gz | 421143 | download |
urls-archive.max.fan-twitter-@NYPD73Pct-filtered.txt-shallow-20200711-000458-65uj2-meta.warc.gz | 225926 | download job |
urls-archive.max.fan-twitter-@NYPD73Pct-filtered.txt-shallow-20200711-000458-65uj2-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD73Pct-filtered.txt-shallow-20200711-000458-65uj2-urls.txt | 104865 | download |
urls-archive.max.fan-twitter-@NYPD73Pct-filtered.txt-shallow-20200711-000458-65uj2.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD75Pct-filtered.txt-shallow-20200711-000456-ckw0i-00000.warc.gz | 440659033 | download job |
urls-archive.max.fan-twitter-@NYPD75Pct-filtered.txt-shallow-20200711-000456-ckw0i-00000.warc.os.cdx.gz | 432705 | download |
urls-archive.max.fan-twitter-@NYPD75Pct-filtered.txt-shallow-20200711-000456-ckw0i-meta.warc.gz | 232347 | download job |
urls-archive.max.fan-twitter-@NYPD75Pct-filtered.txt-shallow-20200711-000456-ckw0i-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD75Pct-filtered.txt-shallow-20200711-000456-ckw0i-urls.txt | 114396 | download |
urls-archive.max.fan-twitter-@NYPD75Pct-filtered.txt-shallow-20200711-000456-ckw0i.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD76Pct-filtered.txt-shallow-20200711-000450-9v6ma-00000.warc.gz | 267565376 | download job |
urls-archive.max.fan-twitter-@NYPD76Pct-filtered.txt-shallow-20200711-000450-9v6ma-00000.warc.os.cdx.gz | 287185 | download |
urls-archive.max.fan-twitter-@NYPD76Pct-filtered.txt-shallow-20200711-000450-9v6ma-meta.warc.gz | 157345 | download job |
urls-archive.max.fan-twitter-@NYPD76Pct-filtered.txt-shallow-20200711-000450-9v6ma-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD76Pct-filtered.txt-shallow-20200711-000450-9v6ma-urls.txt | 71413 | download |
urls-archive.max.fan-twitter-@NYPD76Pct-filtered.txt-shallow-20200711-000450-9v6ma.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD77Pct-filtered.txt-shallow-20200710-235931-944bq-00000.warc.gz | 877850138 | download job |
urls-archive.max.fan-twitter-@NYPD77Pct-filtered.txt-shallow-20200710-235931-944bq-00000.warc.os.cdx.gz | 930300 | download |
urls-archive.max.fan-twitter-@NYPD77Pct-filtered.txt-shallow-20200710-235931-944bq-meta.warc.gz | 492919 | download job |
urls-archive.max.fan-twitter-@NYPD77Pct-filtered.txt-shallow-20200710-235931-944bq-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD77Pct-filtered.txt-shallow-20200710-235931-944bq-urls.txt | 252970 | download |
urls-archive.max.fan-twitter-@NYPD77Pct-filtered.txt-shallow-20200710-235931-944bq.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD78Pct-filtered.txt-shallow-20200710-235930-glidx-00000.warc.gz | 542610872 | download job |
urls-archive.max.fan-twitter-@NYPD78Pct-filtered.txt-shallow-20200710-235930-glidx-00000.warc.os.cdx.gz | 551701 | download |
urls-archive.max.fan-twitter-@NYPD78Pct-filtered.txt-shallow-20200710-235930-glidx-meta.warc.gz | 296063 | download job |
urls-archive.max.fan-twitter-@NYPD78Pct-filtered.txt-shallow-20200710-235930-glidx-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD78Pct-filtered.txt-shallow-20200710-235930-glidx-urls.txt | 157620 | download |
urls-archive.max.fan-twitter-@NYPD78Pct-filtered.txt-shallow-20200710-235930-glidx.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD79Pct-filtered.txt-shallow-20200710-235511-a2zbp-00000.warc.gz | 489497397 | download job |
urls-archive.max.fan-twitter-@NYPD79Pct-filtered.txt-shallow-20200710-235511-a2zbp-00000.warc.os.cdx.gz | 459236 | download |
urls-archive.max.fan-twitter-@NYPD79Pct-filtered.txt-shallow-20200710-235511-a2zbp-meta.warc.gz | 245804 | download job |
urls-archive.max.fan-twitter-@NYPD79Pct-filtered.txt-shallow-20200710-235511-a2zbp-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD79Pct-filtered.txt-shallow-20200710-235511-a2zbp-urls.txt | 115905 | download |
urls-archive.max.fan-twitter-@NYPD79Pct-filtered.txt-shallow-20200710-235511-a2zbp.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD7Pct-filtered.txt-shallow-20200710-235507-ckpxm-00000.warc.gz | 378794809 | download job |
urls-archive.max.fan-twitter-@NYPD7Pct-filtered.txt-shallow-20200710-235507-ckpxm-00000.warc.os.cdx.gz | 379227 | download |
urls-archive.max.fan-twitter-@NYPD7Pct-filtered.txt-shallow-20200710-235507-ckpxm-meta.warc.gz | 204619 | download job |
urls-archive.max.fan-twitter-@NYPD7Pct-filtered.txt-shallow-20200710-235507-ckpxm-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD7Pct-filtered.txt-shallow-20200710-235507-ckpxm-urls.txt | 91442 | download |
urls-archive.max.fan-twitter-@NYPD7Pct-filtered.txt-shallow-20200710-235507-ckpxm.json | 331 | download job |
urls-archive.max.fan-twitter-@NYPD81Pct-filtered.txt-shallow-20200710-235506-eze12-00000.warc.gz | 553406943 | download job |
urls-archive.max.fan-twitter-@NYPD81Pct-filtered.txt-shallow-20200710-235506-eze12-00000.warc.os.cdx.gz | 398100 | download |
urls-archive.max.fan-twitter-@NYPD81Pct-filtered.txt-shallow-20200710-235506-eze12-meta.warc.gz | 210534 | download job |
urls-archive.max.fan-twitter-@NYPD81Pct-filtered.txt-shallow-20200710-235506-eze12-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD81Pct-filtered.txt-shallow-20200710-235506-eze12-urls.txt | 101874 | download |
urls-archive.max.fan-twitter-@NYPD81Pct-filtered.txt-shallow-20200710-235506-eze12.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD83Pct-filtered.txt-shallow-20200710-235506-1rsmw-00000.warc.gz | 884617871 | download job |
urls-archive.max.fan-twitter-@NYPD83Pct-filtered.txt-shallow-20200710-235506-1rsmw-00000.warc.os.cdx.gz | 740417 | download |
urls-archive.max.fan-twitter-@NYPD83Pct-filtered.txt-shallow-20200710-235506-1rsmw-meta.warc.gz | 391466 | download job |
urls-archive.max.fan-twitter-@NYPD83Pct-filtered.txt-shallow-20200710-235506-1rsmw-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD83Pct-filtered.txt-shallow-20200710-235506-1rsmw-urls.txt | 195969 | download |
urls-archive.max.fan-twitter-@NYPD83Pct-filtered.txt-shallow-20200710-235506-1rsmw.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD84Pct-filtered.txt-shallow-20200710-234919-6byjt-00000.warc.gz | 480725772 | download job |
urls-archive.max.fan-twitter-@NYPD84Pct-filtered.txt-shallow-20200710-234919-6byjt-00000.warc.os.cdx.gz | 401226 | download |
urls-archive.max.fan-twitter-@NYPD84Pct-filtered.txt-shallow-20200710-234919-6byjt-meta.warc.gz | 213473 | download job |
urls-archive.max.fan-twitter-@NYPD84Pct-filtered.txt-shallow-20200710-234919-6byjt-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD84Pct-filtered.txt-shallow-20200710-234919-6byjt-urls.txt | 92974 | download |
urls-archive.max.fan-twitter-@NYPD84Pct-filtered.txt-shallow-20200710-234919-6byjt.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD88Pct-filtered.txt-shallow-20200710-234918-6208z-00000.warc.gz | 445585665 | download job |
urls-archive.max.fan-twitter-@NYPD88Pct-filtered.txt-shallow-20200710-234918-6208z-00000.warc.os.cdx.gz | 448434 | download |
urls-archive.max.fan-twitter-@NYPD88Pct-filtered.txt-shallow-20200710-234918-6208z-meta.warc.gz | 241810 | download job |
urls-archive.max.fan-twitter-@NYPD88Pct-filtered.txt-shallow-20200710-234918-6208z-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD88Pct-filtered.txt-shallow-20200710-234918-6208z-urls.txt | 120300 | download |
urls-archive.max.fan-twitter-@NYPD88Pct-filtered.txt-shallow-20200710-234918-6208z.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPD90Pct-filtered.txt-shallow-20200710-234916-1yn3w-00000.warc.gz | 407533555 | download job |
urls-archive.max.fan-twitter-@NYPD90Pct-filtered.txt-shallow-20200710-234916-1yn3w-00000.warc.os.cdx.gz | 416999 | download |
urls-archive.max.fan-twitter-@NYPD90Pct-filtered.txt-shallow-20200710-234916-1yn3w-meta.warc.gz | 226317 | download job |
urls-archive.max.fan-twitter-@NYPD90Pct-filtered.txt-shallow-20200710-234916-1yn3w-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPD90Pct-filtered.txt-shallow-20200710-234916-1yn3w-urls.txt | 120910 | download |
urls-archive.max.fan-twitter-@NYPD90Pct-filtered.txt-shallow-20200710-234916-1yn3w.json | 333 | download job |
urls-archive.max.fan-twitter-@NYPDCT-filtered.txt-shallow-20200710-232602-4izi2-00000.warc.gz | 841197712 | download job |
urls-archive.max.fan-twitter-@NYPDCT-filtered.txt-shallow-20200710-232602-4izi2-00000.warc.os.cdx.gz | 1146558 | download |
urls-archive.max.fan-twitter-@NYPDCT-filtered.txt-shallow-20200710-232602-4izi2-meta.warc.gz | 612342 | download job |
urls-archive.max.fan-twitter-@NYPDCT-filtered.txt-shallow-20200710-232602-4izi2-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPDCT-filtered.txt-shallow-20200710-232602-4izi2-urls.txt | 150142 | download |
urls-archive.max.fan-twitter-@NYPDCT-filtered.txt-shallow-20200710-232602-4izi2.json | 327 | download job |
urls-archive.max.fan-twitter-@NYPDCeremonial-filtered.txt-shallow-20200710-232831-dz5ut-00000.warc.gz | 1162400083 | download job |
urls-archive.max.fan-twitter-@NYPDCeremonial-filtered.txt-shallow-20200710-232831-dz5ut-00000.warc.os.cdx.gz | 862213 | download |
urls-archive.max.fan-twitter-@NYPDCeremonial-filtered.txt-shallow-20200710-232831-dz5ut-meta.warc.gz | 456244 | download job |
urls-archive.max.fan-twitter-@NYPDCeremonial-filtered.txt-shallow-20200710-232831-dz5ut-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPDCeremonial-filtered.txt-shallow-20200710-232831-dz5ut-urls.txt | 150624 | download |
urls-archive.max.fan-twitter-@NYPDCeremonial-filtered.txt-shallow-20200710-232831-dz5ut.json | 343 | download job |
urls-archive.max.fan-twitter-@NYPDChiefPatrol-filtered.txt-shallow-20200710-232803-7gj0y-00000.warc.gz | 579805487 | download job |
urls-archive.max.fan-twitter-@NYPDChiefPatrol-filtered.txt-shallow-20200710-232803-7gj0y-00000.warc.os.cdx.gz | 670680 | download |
urls-archive.max.fan-twitter-@NYPDChiefofDept-filtered.txt-shallow-20200710-232829-3fa7e-00000.warc.gz | 670813167 | download job |
urls-archive.max.fan-twitter-@NYPDChiefofDept-filtered.txt-shallow-20200710-232829-3fa7e-00000.warc.os.cdx.gz | 993222 | download |
urls-archive.max.fan-twitter-@NYPDChiefofDept-filtered.txt-shallow-20200710-232829-3fa7e-meta.warc.gz | 533314 | download job |
urls-archive.max.fan-twitter-@NYPDChiefofDept-filtered.txt-shallow-20200710-232829-3fa7e-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPDChiefofDept-filtered.txt-shallow-20200710-232829-3fa7e-urls.txt | 141572 | download |
urls-archive.max.fan-twitter-@NYPDChiefofDept-filtered.txt-shallow-20200710-232829-3fa7e.json | 345 | download job |
urls-archive.max.fan-twitter-@NYPDCommAffairs-filtered.txt-shallow-20200710-232739-5q4qw-00000.warc.gz | 2020779107 | download job |
urls-archive.max.fan-twitter-@NYPDCommAffairs-filtered.txt-shallow-20200710-232739-5q4qw-00000.warc.os.cdx.gz | 1725406 | download |
urls-archive.max.fan-twitter-@NYPDCommAffairs-filtered.txt-shallow-20200710-232739-5q4qw-meta.warc.gz | 904311 | download job |
urls-archive.max.fan-twitter-@NYPDCommAffairs-filtered.txt-shallow-20200710-232739-5q4qw-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPDCommAffairs-filtered.txt-shallow-20200710-232739-5q4qw-urls.txt | 435474 | download |
urls-archive.max.fan-twitter-@NYPDCommAffairs-filtered.txt-shallow-20200710-232739-5q4qw.json | 345 | download job |
urls-archive.max.fan-twitter-@NYPDDCPI-filtered.txt-shallow-20200710-232342-cxwt2.json | 331 | download job |
urls-archive.max.fan-twitter-@NYPDDetectives-filtered.txt-shallow-20200710-232232-98hav-00000.warc.gz | 555155038 | download job |
urls-archive.max.fan-twitter-@NYPDDetectives-filtered.txt-shallow-20200710-232232-98hav-00000.warc.os.cdx.gz | 967208 | download |
urls-archive.max.fan-twitter-@NYPDDetectives-filtered.txt-shallow-20200710-232232-98hav-meta.warc.gz | 517205 | download job |
urls-archive.max.fan-twitter-@NYPDDetectives-filtered.txt-shallow-20200710-232232-98hav-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPDDetectives-filtered.txt-shallow-20200710-232232-98hav-urls.txt | 163451 | download |
urls-archive.max.fan-twitter-@NYPDDetectives-filtered.txt-shallow-20200710-232232-98hav.json | 343 | download job |
urls-archive.max.fan-twitter-@NYPDShea-filtered.txt-shallow-20200710-221743-8vm3u-meta.warc.gz | 600597 | download job |
urls-archive.max.fan-twitter-@NYPDShea-filtered.txt-shallow-20200710-221743-8vm3u-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPDauxiliary-filtered.txt-shallow-20200710-233513-42rwa-00000.warc.gz | 1151933012 | download job |
urls-archive.max.fan-twitter-@NYPDauxiliary-filtered.txt-shallow-20200710-233513-42rwa-00000.warc.os.cdx.gz | 807851 | download |
urls-archive.max.fan-twitter-@NYPDauxiliary-filtered.txt-shallow-20200710-233513-42rwa-meta.warc.gz | 423460 | download job |
urls-archive.max.fan-twitter-@NYPDauxiliary-filtered.txt-shallow-20200710-233513-42rwa-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYPDauxiliary-filtered.txt-shallow-20200710-233513-42rwa-urls.txt | 193059 | download |
urls-archive.max.fan-twitter-@NYPDauxiliary-filtered.txt-shallow-20200710-233513-42rwa.json | 341 | download job |
urls-archive.max.fan-twitter-@NYTObits-filtered.txt-shallow-20200710-211552-2uhg1.json | 331 | download job |
urls-archive.max.fan-twitter-@NYTmag-filtered.txt-shallow-20200710-211953-axv3e-00000.warc.gz | 2808193317 | download job |
urls-archive.max.fan-twitter-@NYTmag-filtered.txt-shallow-20200710-211953-axv3e-00000.warc.os.cdx.gz | 6746298 | download |
urls-archive.max.fan-twitter-@NYTmag-filtered.txt-shallow-20200710-211953-axv3e-meta.warc.gz | 3536539 | download job |
urls-archive.max.fan-twitter-@NYTmag-filtered.txt-shallow-20200710-211953-axv3e-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@NYTmag-filtered.txt-shallow-20200710-211953-axv3e-urls.txt | 1473279 | download |
urls-archive.max.fan-twitter-@NYTmag-filtered.txt-shallow-20200710-211953-axv3e.json | 327 | download job |
urls-archive.max.fan-twitter-@PlymouthNHPD-filtered.txt-shallow-20200711-025159-5ldgv-00000.warc.gz | 3586425 | download job |
urls-archive.max.fan-twitter-@PlymouthNHPD-filtered.txt-shallow-20200711-025159-5ldgv-00000.warc.os.cdx.gz | 7603 | download |
urls-archive.max.fan-twitter-@PlymouthNHPD-filtered.txt-shallow-20200711-025159-5ldgv.json | 339 | download job |
urls-archive.max.fan-twitter-@Plymouth_Police-filtered.txt-shallow-20200711-024522-695lw-meta.warc.gz | 81637 | download job |
urls-archive.max.fan-twitter-@Plymouth_Police-filtered.txt-shallow-20200711-024522-695lw-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Plymouth_Police-filtered.txt-shallow-20200711-024522-695lw.json | 345 | download job |
urls-archive.max.fan-twitter-@RPD02370-filtered.txt-shallow-20200711-023117-f33wk-meta.warc.gz | 37221 | download job |
urls-archive.max.fan-twitter-@RPD02370-filtered.txt-shallow-20200711-023117-f33wk-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@RehobothPD-filtered.txt-shallow-20200711-024228-44tqz-urls.txt | 19274 | download |
urls-archive.max.fan-twitter-@RehobothPD-filtered.txt-shallow-20200711-024228-44tqz.json | 335 | download job |
urls-archive.max.fan-twitter-@RepTomConroy-filtered.txt-shallow-20200711-023822-4f84d.json | 339 | download job |
urls-archive.max.fan-twitter-@RockSheriffNH-filtered.txt-shallow-20200711-023119-buhk0-00000.warc.gz | 74438149 | download job |
urls-archive.max.fan-twitter-@RockSheriffNH-filtered.txt-shallow-20200711-023119-buhk0-00000.warc.os.cdx.gz | 90586 | download |
urls-archive.max.fan-twitter-@SCDPS_PIO-filtered.txt-shallow-20200711-022645-36kxj-00000.warc.gz | 275054688 | download job |
urls-archive.max.fan-twitter-@SCDPS_PIO-filtered.txt-shallow-20200711-022645-36kxj-00000.warc.os.cdx.gz | 444466 | download |
urls-archive.max.fan-twitter-@SCDPS_PIO-filtered.txt-shallow-20200711-022645-36kxj-urls.txt | 94438 | download |
urls-archive.max.fan-twitter-@SCDPS_PIO-filtered.txt-shallow-20200711-022645-36kxj.json | 333 | download job |
urls-archive.max.fan-twitter-@SPD_HQ-filtered.txt-shallow-20200711-014217-4v4oq-00000.warc.gz | 103716061 | download job |
urls-archive.max.fan-twitter-@SPD_HQ-filtered.txt-shallow-20200711-014217-4v4oq-00000.warc.os.cdx.gz | 149813 | download |
urls-archive.max.fan-twitter-@SPD_HQ-filtered.txt-shallow-20200711-014217-4v4oq-meta.warc.gz | 84121 | download job |
urls-archive.max.fan-twitter-@SPD_HQ-filtered.txt-shallow-20200711-014217-4v4oq-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@SPD_HQ-filtered.txt-shallow-20200711-014217-4v4oq-urls.txt | 86960 | download |
urls-archive.max.fan-twitter-@SbgePolice-filtered.txt-shallow-20200711-022834-9g09r-00000.warc.gz | 1089099 | download job |
urls-archive.max.fan-twitter-@SbgePolice-filtered.txt-shallow-20200711-022834-9g09r-00000.warc.os.cdx.gz | 4874 | download |
urls-archive.max.fan-twitter-@SgtDearthHPD-filtered.txt-shallow-20200711-021012-50p2v-urls.txt | 149345 | download |
urls-archive.max.fan-twitter-@SharonMAPolice-filtered.txt-shallow-20200711-020735-6l7mv-00000.warc.gz | 341256687 | download job |
urls-archive.max.fan-twitter-@SharonMAPolice-filtered.txt-shallow-20200711-020735-6l7mv-00000.warc.os.cdx.gz | 269972 | download |
urls-archive.max.fan-twitter-@SherbornMAPD-filtered.txt-shallow-20200711-020733-4auqz-00000.warc.gz | 38016771 | download job |
urls-archive.max.fan-twitter-@SherbornMAPD-filtered.txt-shallow-20200711-020733-4auqz-00000.warc.os.cdx.gz | 47165 | download |
urls-archive.max.fan-twitter-@SheriffBowler-filtered.txt-shallow-20200711-020640-2vn3f-00000.warc.gz | 29531935 | download job |
urls-archive.max.fan-twitter-@SheriffBowler-filtered.txt-shallow-20200711-020640-2vn3f-00000.warc.os.cdx.gz | 30426 | download |
urls-archive.max.fan-twitter-@SheriffBowler-filtered.txt-shallow-20200711-020640-2vn3f.json | 341 | download job |
urls-archive.max.fan-twitter-@SouthHadley_PD-filtered.txt-shallow-20200711-014319-9z585-00000.warc.gz | 40172909 | download job |
urls-archive.max.fan-twitter-@SouthHadley_PD-filtered.txt-shallow-20200711-014319-9z585-00000.warc.os.cdx.gz | 47766 | download |
urls-archive.max.fan-twitter-@SouthHadley_PD-filtered.txt-shallow-20200711-014319-9z585-meta.warc.gz | 29803 | download job |
urls-archive.max.fan-twitter-@SouthHadley_PD-filtered.txt-shallow-20200711-014319-9z585-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@SouthHadley_PD-filtered.txt-shallow-20200711-014319-9z585-urls.txt | 38979 | download |
urls-archive.max.fan-twitter-@SouthHadley_PD-filtered.txt-shallow-20200711-014319-9z585.json | 343 | download job |
urls-archive.max.fan-twitter-@SouthboroughPd-filtered.txt-shallow-20200711-014409-d52l7-00000.warc.gz | 13353431 | download job |
urls-archive.max.fan-twitter-@SouthboroughPd-filtered.txt-shallow-20200711-014409-d52l7-00000.warc.os.cdx.gz | 20979 | download |
urls-archive.max.fan-twitter-@SouthboroughPd-filtered.txt-shallow-20200711-014409-d52l7-meta.warc.gz | 15570 | download job |
urls-archive.max.fan-twitter-@SouthboroughPd-filtered.txt-shallow-20200711-014409-d52l7-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@SouthboroughPd-filtered.txt-shallow-20200711-014409-d52l7-urls.txt | 4360 | download |
urls-archive.max.fan-twitter-@SouthboroughPd-filtered.txt-shallow-20200711-014409-d52l7.json | 343 | download job |
urls-archive.max.fan-twitter-@SpencerMAPolice-filtered.txt-shallow-20200711-014207-dcexu-00000.warc.gz | 129253310 | download job |
urls-archive.max.fan-twitter-@SpencerMAPolice-filtered.txt-shallow-20200711-014207-dcexu-00000.warc.os.cdx.gz | 107028 | download |
urls-archive.max.fan-twitter-@SpencerMAPolice-filtered.txt-shallow-20200711-014207-dcexu-meta.warc.gz | 61317 | download job |
urls-archive.max.fan-twitter-@SpencerMAPolice-filtered.txt-shallow-20200711-014207-dcexu-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@SpencerMAPolice-filtered.txt-shallow-20200711-014207-dcexu-urls.txt | 29515 | download |
urls-archive.max.fan-twitter-@SpencerMAPolice-filtered.txt-shallow-20200711-014207-dcexu.json | 345 | download job |
urls-archive.max.fan-twitter-@StonehamMAPD-filtered.txt-shallow-20200711-014201-85z9j-00000.warc.gz | 74665277 | download job |
urls-archive.max.fan-twitter-@StonehamMAPD-filtered.txt-shallow-20200711-014201-85z9j-00000.warc.os.cdx.gz | 104001 | download |
urls-archive.max.fan-twitter-@StonehamMAPD-filtered.txt-shallow-20200711-014201-85z9j-meta.warc.gz | 60179 | download job |
urls-archive.max.fan-twitter-@StonehamMAPD-filtered.txt-shallow-20200711-014201-85z9j-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@StonehamMAPD-filtered.txt-shallow-20200711-014201-85z9j-urls.txt | 28593 | download |
urls-archive.max.fan-twitter-@StonehamMAPD-filtered.txt-shallow-20200711-014201-85z9j.json | 339 | download job |
urls-archive.max.fan-twitter-@StoughtonPD-filtered.txt-shallow-20200711-014200-eeq31-00000.warc.gz | 179346321 | download job |
urls-archive.max.fan-twitter-@StoughtonPD-filtered.txt-shallow-20200711-014200-eeq31-00000.warc.os.cdx.gz | 251096 | download |
urls-archive.max.fan-twitter-@StoughtonPD-filtered.txt-shallow-20200711-014200-eeq31-meta.warc.gz | 136769 | download job |
urls-archive.max.fan-twitter-@StoughtonPD-filtered.txt-shallow-20200711-014200-eeq31-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@StoughtonPD-filtered.txt-shallow-20200711-014200-eeq31-urls.txt | 115955 | download |
urls-archive.max.fan-twitter-@StoughtonPD-filtered.txt-shallow-20200711-014200-eeq31.json | 337 | download job |
urls-archive.max.fan-twitter-@Sturbridge_PD-filtered.txt-shallow-20200711-013708-aayh5-00000.warc.gz | 204306209 | download job |
urls-archive.max.fan-twitter-@Sturbridge_PD-filtered.txt-shallow-20200711-013708-aayh5-00000.warc.os.cdx.gz | 205261 | download |
urls-archive.max.fan-twitter-@Sturbridge_PD-filtered.txt-shallow-20200711-013708-aayh5-meta.warc.gz | 113414 | download job |
urls-archive.max.fan-twitter-@Sturbridge_PD-filtered.txt-shallow-20200711-013708-aayh5-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Sturbridge_PD-filtered.txt-shallow-20200711-013708-aayh5-urls.txt | 98089 | download |
urls-archive.max.fan-twitter-@Sturbridge_PD-filtered.txt-shallow-20200711-013708-aayh5.json | 341 | download job |
urls-archive.max.fan-twitter-@Sudbury_Police-filtered.txt-shallow-20200711-013705-dipcx-00000.warc.gz | 48958688 | download job |
urls-archive.max.fan-twitter-@Sudbury_Police-filtered.txt-shallow-20200711-013705-dipcx-00000.warc.os.cdx.gz | 77654 | download |
urls-archive.max.fan-twitter-@Sudbury_Police-filtered.txt-shallow-20200711-013705-dipcx-meta.warc.gz | 46368 | download job |
urls-archive.max.fan-twitter-@Sudbury_Police-filtered.txt-shallow-20200711-013705-dipcx-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Sudbury_Police-filtered.txt-shallow-20200711-013705-dipcx-urls.txt | 35818 | download |
urls-archive.max.fan-twitter-@Sudbury_Police-filtered.txt-shallow-20200711-013705-dipcx.json | 343 | download job |
urls-archive.max.fan-twitter-@SunderlandMAPD-filtered.txt-shallow-20200711-013701-f1cq3-00000.warc.gz | 25839431 | download job |
urls-archive.max.fan-twitter-@SunderlandMAPD-filtered.txt-shallow-20200711-013701-f1cq3-00000.warc.os.cdx.gz | 32149 | download |
urls-archive.max.fan-twitter-@SunderlandMAPD-filtered.txt-shallow-20200711-013701-f1cq3-meta.warc.gz | 21712 | download job |
urls-archive.max.fan-twitter-@SunderlandMAPD-filtered.txt-shallow-20200711-013701-f1cq3-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@SunderlandMAPD-filtered.txt-shallow-20200711-013701-f1cq3-urls.txt | 18476 | download |
urls-archive.max.fan-twitter-@SunderlandMAPD-filtered.txt-shallow-20200711-013701-f1cq3.json | 343 | download job |
urls-archive.max.fan-twitter-@SwampscottPD-filtered.txt-shallow-20200711-013420-bgias-00000.warc.gz | 27040451 | download job |
urls-archive.max.fan-twitter-@SwampscottPD-filtered.txt-shallow-20200711-013420-bgias-00000.warc.os.cdx.gz | 49317 | download |
urls-archive.max.fan-twitter-@SwampscottPD-filtered.txt-shallow-20200711-013420-bgias-meta.warc.gz | 31082 | download job |
urls-archive.max.fan-twitter-@SwampscottPD-filtered.txt-shallow-20200711-013420-bgias-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@SwampscottPD-filtered.txt-shallow-20200711-013420-bgias-urls.txt | 23766 | download |
urls-archive.max.fan-twitter-@SwampscottPD-filtered.txt-shallow-20200711-013420-bgias.json | 339 | download job |
urls-archive.max.fan-twitter-@TorrisiRep-filtered.txt-shallow-20200711-012834-8qjju-00000.warc.gz | 6548604 | download job |
urls-archive.max.fan-twitter-@TorrisiRep-filtered.txt-shallow-20200711-012834-8qjju-00000.warc.os.cdx.gz | 9855 | download |
urls-archive.max.fan-twitter-@TorrisiRep-filtered.txt-shallow-20200711-012834-8qjju-meta.warc.gz | 9506 | download job |
urls-archive.max.fan-twitter-@TorrisiRep-filtered.txt-shallow-20200711-012834-8qjju-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@TorrisiRep-filtered.txt-shallow-20200711-012834-8qjju-urls.txt | 5472 | download |
urls-archive.max.fan-twitter-@TorrisiRep-filtered.txt-shallow-20200711-012834-8qjju.json | 335 | download job |
urls-archive.max.fan-twitter-@TownofBrookline-filtered.txt-shallow-20200711-012831-1q1xn-00000.warc.gz | 458913052 | download job |
urls-archive.max.fan-twitter-@TownofBrookline-filtered.txt-shallow-20200711-012831-1q1xn-00000.warc.os.cdx.gz | 491866 | download |
urls-archive.max.fan-twitter-@TownsendPD-filtered.txt-shallow-20200711-012830-cw3xc-00000.warc.gz | 50835277 | download job |
urls-archive.max.fan-twitter-@TownsendPD-filtered.txt-shallow-20200711-012830-cw3xc-00000.warc.os.cdx.gz | 65347 | download |
urls-archive.max.fan-twitter-@TownsendPD-filtered.txt-shallow-20200711-012830-cw3xc-meta.warc.gz | 39196 | download job |
urls-archive.max.fan-twitter-@TownsendPD-filtered.txt-shallow-20200711-012830-cw3xc-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@TownsendPD-filtered.txt-shallow-20200711-012830-cw3xc-urls.txt | 45916 | download |
urls-archive.max.fan-twitter-@TownsendPD-filtered.txt-shallow-20200711-012830-cw3xc.json | 335 | download job |
urls-archive.max.fan-twitter-@TyngsboroughPD-filtered.txt-shallow-20200711-012827-6t1o4-00000.warc.gz | 175200968 | download job |
urls-archive.max.fan-twitter-@TyngsboroughPD-filtered.txt-shallow-20200711-012827-6t1o4-00000.warc.os.cdx.gz | 203880 | download |
urls-archive.max.fan-twitter-@TyngsboroughPD-filtered.txt-shallow-20200711-012827-6t1o4-meta.warc.gz | 113014 | download job |
urls-archive.max.fan-twitter-@TyngsboroughPD-filtered.txt-shallow-20200711-012827-6t1o4-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@TyngsboroughPD-filtered.txt-shallow-20200711-012827-6t1o4-urls.txt | 99853 | download |
urls-archive.max.fan-twitter-@TyngsboroughPD-filtered.txt-shallow-20200711-012827-6t1o4.json | 343 | download job |
urls-archive.max.fan-twitter-@UMassDPolice-filtered.txt-shallow-20200711-012821-2p5yd-00000.warc.gz | 153162215 | download job |
urls-archive.max.fan-twitter-@UMassDPolice-filtered.txt-shallow-20200711-012821-2p5yd-00000.warc.os.cdx.gz | 194676 | download |
urls-archive.max.fan-twitter-@UMassDPolice-filtered.txt-shallow-20200711-012821-2p5yd-meta.warc.gz | 108733 | download job |
urls-archive.max.fan-twitter-@UMassDPolice-filtered.txt-shallow-20200711-012821-2p5yd-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@UMassDPolice-filtered.txt-shallow-20200711-012821-2p5yd-urls.txt | 88431 | download |
urls-archive.max.fan-twitter-@UMassDPolice-filtered.txt-shallow-20200711-012821-2p5yd.json | 339 | download job |
urls-archive.max.fan-twitter-@UNH_Police-filtered.txt-shallow-20200711-012402-1j25w-00000.warc.gz | 198382233 | download job |
urls-archive.max.fan-twitter-@UNH_Police-filtered.txt-shallow-20200711-012402-1j25w-00000.warc.os.cdx.gz | 258013 | download |
urls-archive.max.fan-twitter-@UNH_Police-filtered.txt-shallow-20200711-012402-1j25w-meta.warc.gz | 142430 | download job |
urls-archive.max.fan-twitter-@UNH_Police-filtered.txt-shallow-20200711-012402-1j25w-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@UNH_Police-filtered.txt-shallow-20200711-012402-1j25w-urls.txt | 149120 | download |
urls-archive.max.fan-twitter-@UNH_Police-filtered.txt-shallow-20200711-012402-1j25w.json | 335 | download job |
urls-archive.max.fan-twitter-@USDOT-filtered.txt-shallow-20200711-012401-707qn.json | 325 | download job |
urls-archive.max.fan-twitter-@UTHighwayPatrol-filtered.txt-shallow-20200711-012356-a5p8i-00000.warc.gz | 348523643 | download job |
urls-archive.max.fan-twitter-@UTHighwayPatrol-filtered.txt-shallow-20200711-012356-a5p8i-00000.warc.os.cdx.gz | 623444 | download |
urls-archive.max.fan-twitter-@UTHighwayPatrol-filtered.txt-shallow-20200711-012356-a5p8i-meta.warc.gz | 338563 | download job |
urls-archive.max.fan-twitter-@UTHighwayPatrol-filtered.txt-shallow-20200711-012356-a5p8i-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@UTHighwayPatrol-filtered.txt-shallow-20200711-012356-a5p8i-urls.txt | 146429 | download |
urls-archive.max.fan-twitter-@UTHighwayPatrol-filtered.txt-shallow-20200711-012356-a5p8i.json | 345 | download job |
urls-archive.max.fan-twitter-@WESTON_FIRE-filtered.txt-shallow-20200711-011658-169mz-00000.warc.gz | 244788334 | download job |
urls-archive.max.fan-twitter-@WESTON_FIRE-filtered.txt-shallow-20200711-011658-169mz-00000.warc.os.cdx.gz | 218676 | download |
urls-archive.max.fan-twitter-@WESTON_FIRE-filtered.txt-shallow-20200711-011658-169mz-meta.warc.gz | 119385 | download job |
urls-archive.max.fan-twitter-@WESTON_FIRE-filtered.txt-shallow-20200711-011658-169mz-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WESTON_FIRE-filtered.txt-shallow-20200711-011658-169mz-urls.txt | 121614 | download |
urls-archive.max.fan-twitter-@WESTON_FIRE-filtered.txt-shallow-20200711-011658-169mz.json | 337 | download job |
urls-archive.max.fan-twitter-@WPD25-filtered.txt-shallow-20200711-011413-a6dc3-00000.warc.gz | 31342319 | download job |
urls-archive.max.fan-twitter-@WPD25-filtered.txt-shallow-20200711-011413-a6dc3-00000.warc.os.cdx.gz | 45002 | download |
urls-archive.max.fan-twitter-@WPD25-filtered.txt-shallow-20200711-011413-a6dc3-meta.warc.gz | 28802 | download job |
urls-archive.max.fan-twitter-@WPD25-filtered.txt-shallow-20200711-011413-a6dc3-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WPD25-filtered.txt-shallow-20200711-011413-a6dc3-urls.txt | 22481 | download |
urls-archive.max.fan-twitter-@WPD25-filtered.txt-shallow-20200711-011413-a6dc3.json | 325 | download job |
urls-archive.max.fan-twitter-@WPDComm-filtered.txt-shallow-20200711-005244-93hht-00000.warc.gz | 56992919 | download job |
urls-archive.max.fan-twitter-@WPDComm-filtered.txt-shallow-20200711-005244-93hht-00000.warc.os.cdx.gz | 85664 | download |
urls-archive.max.fan-twitter-@WPDComm-filtered.txt-shallow-20200711-005244-93hht-meta.warc.gz | 50357 | download job |
urls-archive.max.fan-twitter-@WPDComm-filtered.txt-shallow-20200711-005244-93hht-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WPDComm-filtered.txt-shallow-20200711-005244-93hht-urls.txt | 49287 | download |
urls-archive.max.fan-twitter-@WPDComm-filtered.txt-shallow-20200711-005244-93hht.json | 329 | download job |
urls-archive.max.fan-twitter-@WVStatePolice-filtered.txt-shallow-20200711-005242-c4of7-00000.warc.gz | 147169216 | download job |
urls-archive.max.fan-twitter-@WVStatePolice-filtered.txt-shallow-20200711-005242-c4of7-00000.warc.os.cdx.gz | 250085 | download |
urls-archive.max.fan-twitter-@WVStatePolice-filtered.txt-shallow-20200711-005242-c4of7-meta.warc.gz | 138240 | download job |
urls-archive.max.fan-twitter-@WVStatePolice-filtered.txt-shallow-20200711-005242-c4of7-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WVStatePolice-filtered.txt-shallow-20200711-005242-c4of7-urls.txt | 110840 | download |
urls-archive.max.fan-twitter-@WVStatePolice-filtered.txt-shallow-20200711-005242-c4of7.json | 341 | download job |
urls-archive.max.fan-twitter-@WakefieldPD-filtered.txt-shallow-20200711-011953-cgcoy-00000.warc.gz | 106642189 | download job |
urls-archive.max.fan-twitter-@WakefieldPD-filtered.txt-shallow-20200711-011953-cgcoy-00000.warc.os.cdx.gz | 158261 | download |
urls-archive.max.fan-twitter-@WakefieldPD-filtered.txt-shallow-20200711-011953-cgcoy-meta.warc.gz | 89027 | download job |
urls-archive.max.fan-twitter-@WakefieldPD-filtered.txt-shallow-20200711-011953-cgcoy-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WakefieldPD-filtered.txt-shallow-20200711-011953-cgcoy-urls.txt | 55928 | download |
urls-archive.max.fan-twitter-@WakefieldPD-filtered.txt-shallow-20200711-011953-cgcoy.json | 337 | download job |
urls-archive.max.fan-twitter-@WalthamFireDept-filtered.txt-shallow-20200711-011952-3itmg-00000.warc.gz | 111092643 | download job |
urls-archive.max.fan-twitter-@WalthamFireDept-filtered.txt-shallow-20200711-011952-3itmg-00000.warc.os.cdx.gz | 103605 | download |
urls-archive.max.fan-twitter-@WalthamFireDept-filtered.txt-shallow-20200711-011952-3itmg-meta.warc.gz | 59957 | download job |
urls-archive.max.fan-twitter-@WalthamFireDept-filtered.txt-shallow-20200711-011952-3itmg-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WalthamFireDept-filtered.txt-shallow-20200711-011952-3itmg-urls.txt | 25950 | download |
urls-archive.max.fan-twitter-@WalthamFireDept-filtered.txt-shallow-20200711-011952-3itmg.json | 345 | download job |
urls-archive.max.fan-twitter-@WalthamMAPolice-filtered.txt-shallow-20200711-011951-qgoml-00000.warc.gz | 303231968 | download job |
urls-archive.max.fan-twitter-@WalthamMAPolice-filtered.txt-shallow-20200711-011951-qgoml-00000.warc.os.cdx.gz | 453704 | download |
urls-archive.max.fan-twitter-@WalthamMAPolice-filtered.txt-shallow-20200711-011951-qgoml-meta.warc.gz | 247252 | download job |
urls-archive.max.fan-twitter-@WalthamMAPolice-filtered.txt-shallow-20200711-011951-qgoml-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WalthamMAPolice-filtered.txt-shallow-20200711-011951-qgoml-urls.txt | 210353 | download |
urls-archive.max.fan-twitter-@WalthamMAPolice-filtered.txt-shallow-20200711-011951-qgoml.json | 345 | download job |
urls-archive.max.fan-twitter-@WatertownPD-filtered.txt-shallow-20200711-011924-2pjv5-00000.warc.gz | 166680460 | download job |
urls-archive.max.fan-twitter-@WatertownPD-filtered.txt-shallow-20200711-011924-2pjv5-00000.warc.os.cdx.gz | 217056 | download |
urls-archive.max.fan-twitter-@WatertownPD-filtered.txt-shallow-20200711-011924-2pjv5-meta.warc.gz | 120614 | download job |
urls-archive.max.fan-twitter-@WatertownPD-filtered.txt-shallow-20200711-011924-2pjv5-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WatertownPD-filtered.txt-shallow-20200711-011924-2pjv5-urls.txt | 56610 | download |
urls-archive.max.fan-twitter-@WatertownPD-filtered.txt-shallow-20200711-011924-2pjv5.json | 337 | download job |
urls-archive.max.fan-twitter-@WentworthPolice-filtered.txt-shallow-20200711-011815-d3w5h-00000.warc.gz | 10655751 | download job |
urls-archive.max.fan-twitter-@WentworthPolice-filtered.txt-shallow-20200711-011815-d3w5h-00000.warc.os.cdx.gz | 12771 | download |
urls-archive.max.fan-twitter-@WentworthPolice-filtered.txt-shallow-20200711-011815-d3w5h-meta.warc.gz | 11091 | download job |
urls-archive.max.fan-twitter-@WentworthPolice-filtered.txt-shallow-20200711-011815-d3w5h-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WentworthPolice-filtered.txt-shallow-20200711-011815-d3w5h-urls.txt | 10167 | download |
urls-archive.max.fan-twitter-@WentworthPolice-filtered.txt-shallow-20200711-011815-d3w5h.json | 345 | download job |
urls-archive.max.fan-twitter-@WestNewburyPD-filtered.txt-shallow-20200711-011659-ct296-00000.warc.gz | 34884337 | download job |
urls-archive.max.fan-twitter-@WestNewburyPD-filtered.txt-shallow-20200711-011659-ct296-00000.warc.os.cdx.gz | 48714 | download |
urls-archive.max.fan-twitter-@WestNewburyPD-filtered.txt-shallow-20200711-011659-ct296-meta.warc.gz | 30725 | download job |
urls-archive.max.fan-twitter-@WestNewburyPD-filtered.txt-shallow-20200711-011659-ct296-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WestNewburyPD-filtered.txt-shallow-20200711-011659-ct296-urls.txt | 27073 | download |
urls-archive.max.fan-twitter-@WestNewburyPD-filtered.txt-shallow-20200711-011659-ct296.json | 341 | download job |
urls-archive.max.fan-twitter-@WestminsterPDMA-filtered.txt-shallow-20200711-011815-ddlux-00000.warc.gz | 141655241 | download job |
urls-archive.max.fan-twitter-@WestminsterPDMA-filtered.txt-shallow-20200711-011815-ddlux-00000.warc.os.cdx.gz | 156612 | download |
urls-archive.max.fan-twitter-@WestminsterPDMA-filtered.txt-shallow-20200711-011815-ddlux-meta.warc.gz | 88193 | download job |
urls-archive.max.fan-twitter-@WestminsterPDMA-filtered.txt-shallow-20200711-011815-ddlux-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WestminsterPDMA-filtered.txt-shallow-20200711-011815-ddlux-urls.txt | 75684 | download |
urls-archive.max.fan-twitter-@WestminsterPDMA-filtered.txt-shallow-20200711-011815-ddlux.json | 345 | download job |
urls-archive.max.fan-twitter-@WestonMAPD-filtered.txt-shallow-20200711-011657-990td-00000.warc.gz | 30730919 | download job |
urls-archive.max.fan-twitter-@WestonMAPD-filtered.txt-shallow-20200711-011657-990td-00000.warc.os.cdx.gz | 43636 | download |
urls-archive.max.fan-twitter-@WestonMAPD-filtered.txt-shallow-20200711-011657-990td-meta.warc.gz | 27942 | download job |
urls-archive.max.fan-twitter-@WestonMAPD-filtered.txt-shallow-20200711-011657-990td-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WestonMAPD-filtered.txt-shallow-20200711-011657-990td-urls.txt | 28139 | download |
urls-archive.max.fan-twitter-@WestonMAPD-filtered.txt-shallow-20200711-011657-990td.json | 335 | download job |
urls-archive.max.fan-twitter-@WhitmanPolice-filtered.txt-shallow-20200711-011444-bfqj4-00000.warc.gz | 46713632 | download job |
urls-archive.max.fan-twitter-@WhitmanPolice-filtered.txt-shallow-20200711-011444-bfqj4-00000.warc.os.cdx.gz | 64752 | download |
urls-archive.max.fan-twitter-@WhitmanPolice-filtered.txt-shallow-20200711-011444-bfqj4-meta.warc.gz | 40828 | download job |
urls-archive.max.fan-twitter-@WhitmanPolice-filtered.txt-shallow-20200711-011444-bfqj4-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WhitmanPolice-filtered.txt-shallow-20200711-011444-bfqj4-urls.txt | 40046 | download |
urls-archive.max.fan-twitter-@WhitmanPolice-filtered.txt-shallow-20200711-011444-bfqj4.json | 341 | download job |
urls-archive.max.fan-twitter-@WichitaFallsPD-filtered.txt-shallow-20200711-011441-ciin7-00000.warc.gz | 156668475 | download job |
urls-archive.max.fan-twitter-@WichitaFallsPD-filtered.txt-shallow-20200711-011441-ciin7-00000.warc.os.cdx.gz | 171372 | download |
urls-archive.max.fan-twitter-@WichitaFallsPD-filtered.txt-shallow-20200711-011441-ciin7-meta.warc.gz | 94668 | download job |
urls-archive.max.fan-twitter-@WichitaFallsPD-filtered.txt-shallow-20200711-011441-ciin7-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WichitaFallsPD-filtered.txt-shallow-20200711-011441-ciin7-urls.txt | 95538 | download |
urls-archive.max.fan-twitter-@WichitaFallsPD-filtered.txt-shallow-20200711-011441-ciin7.json | 343 | download job |
urls-archive.max.fan-twitter-@Winthroppolice-filtered.txt-shallow-20200711-011419-6qfgo-00000.warc.gz | 16168322 | download job |
urls-archive.max.fan-twitter-@Winthroppolice-filtered.txt-shallow-20200711-011419-6qfgo-00000.warc.os.cdx.gz | 34815 | download |
urls-archive.max.fan-twitter-@Winthroppolice-filtered.txt-shallow-20200711-011419-6qfgo-meta.warc.gz | 23283 | download job |
urls-archive.max.fan-twitter-@Winthroppolice-filtered.txt-shallow-20200711-011419-6qfgo-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@Winthroppolice-filtered.txt-shallow-20200711-011419-6qfgo-urls.txt | 13799 | download |
urls-archive.max.fan-twitter-@Winthroppolice-filtered.txt-shallow-20200711-011419-6qfgo.json | 343 | download job |
urls-archive.max.fan-twitter-@WoburnFire-filtered.txt-shallow-20200711-011417-bncrq-00000.warc.gz | 17280276 | download job |
urls-archive.max.fan-twitter-@WoburnFire-filtered.txt-shallow-20200711-011417-bncrq-00000.warc.os.cdx.gz | 35228 | download |
urls-archive.max.fan-twitter-@WoburnFire-filtered.txt-shallow-20200711-011417-bncrq-meta.warc.gz | 23472 | download job |
urls-archive.max.fan-twitter-@WoburnFire-filtered.txt-shallow-20200711-011417-bncrq-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WoburnFire-filtered.txt-shallow-20200711-011417-bncrq-urls.txt | 7359 | download |
urls-archive.max.fan-twitter-@WoburnFire-filtered.txt-shallow-20200711-011417-bncrq.json | 335 | download job |
urls-archive.max.fan-twitter-@WoburnPolice-filtered.txt-shallow-20200711-011415-85xw9-00000.warc.gz | 44591383 | download job |
urls-archive.max.fan-twitter-@WoburnPolice-filtered.txt-shallow-20200711-011415-85xw9-00000.warc.os.cdx.gz | 90301 | download |
urls-archive.max.fan-twitter-@WoburnPolice-filtered.txt-shallow-20200711-011415-85xw9-meta.warc.gz | 53119 | download job |
urls-archive.max.fan-twitter-@WoburnPolice-filtered.txt-shallow-20200711-011415-85xw9-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@WoburnPolice-filtered.txt-shallow-20200711-011415-85xw9-urls.txt | 35577 | download |
urls-archive.max.fan-twitter-@WoburnPolice-filtered.txt-shallow-20200711-011415-85xw9.json | 339 | download job |
urls-archive.max.fan-twitter-@nytchinese-filtered.txt-shallow-20200710-215302-2fo5h-00000.warc.gz | 5368893933 | download job |
urls-archive.max.fan-twitter-@nytchinese-filtered.txt-shallow-20200710-215302-2fo5h-00000.warc.os.cdx.gz | 10576265 | download |
urls-archive.max.fan-twitter-@nytchinese-filtered.txt-shallow-20200710-215302-2fo5h-00001.warc.gz | 55906868 | download job |
urls-archive.max.fan-twitter-@nytchinese-filtered.txt-shallow-20200710-215302-2fo5h-00001.warc.os.cdx.gz | 222698 | download |
urls-archive.max.fan-twitter-@nytchinese-filtered.txt-shallow-20200710-215302-2fo5h-meta.warc.gz | 5617071 | download job |
urls-archive.max.fan-twitter-@nytchinese-filtered.txt-shallow-20200710-215302-2fo5h-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@nytchinese-filtered.txt-shallow-20200710-215302-2fo5h-urls.txt | 3056152 | download |
urls-archive.max.fan-twitter-@nytchinese-filtered.txt-shallow-20200710-215302-2fo5h.json | 335 | download job |
urls-archive.max.fan-twitter-@nytimeses-filtered.txt-shallow-20200710-214509-ckhq4-00000.warc.gz | 2892253551 | download job |
urls-archive.max.fan-twitter-@nytimeses-filtered.txt-shallow-20200710-214509-ckhq4-00000.warc.os.cdx.gz | 7972631 | download |
urls-archive.max.fan-twitter-@nytimeses-filtered.txt-shallow-20200710-214509-ckhq4-meta.warc.gz | 4137368 | download job |
urls-archive.max.fan-twitter-@nytimeses-filtered.txt-shallow-20200710-214509-ckhq4-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@nytimeses-filtered.txt-shallow-20200710-214509-ckhq4-urls.txt | 1413564 | download |
urls-archive.max.fan-twitter-@nytimeses-filtered.txt-shallow-20200710-214509-ckhq4.json | 333 | download job |
urls-archive.max.fan-twitter-@nytimesmusic-filtered.txt-shallow-20200710-213821-36h4d-00000.warc.gz | 3646797793 | download job |
urls-archive.max.fan-twitter-@nytimesmusic-filtered.txt-shallow-20200710-213821-36h4d-00000.warc.os.cdx.gz | 7766292 | download |
urls-archive.max.fan-twitter-@nytimesmusic-filtered.txt-shallow-20200710-213821-36h4d-meta.warc.gz | 4025244 | download job |
urls-archive.max.fan-twitter-@nytimesmusic-filtered.txt-shallow-20200710-213821-36h4d-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@nytimesmusic-filtered.txt-shallow-20200710-213821-36h4d-urls.txt | 2950233 | download |
urls-archive.max.fan-twitter-@nytimesmusic-filtered.txt-shallow-20200710-213821-36h4d.json | 339 | download job |
urls-archive.max.fan-twitter-@nytrealestate-filtered.txt-shallow-20200710-211550-e9nz2-00000.warc.gz | 5369522753 | download job |
urls-archive.max.fan-twitter-@nytrealestate-filtered.txt-shallow-20200710-211550-e9nz2-00000.warc.os.cdx.gz | 3129891 | download |
urls-archive.max.fan-twitter-@nytrealestate-filtered.txt-shallow-20200710-211550-e9nz2-00001.warc.gz | 2022088746 | download job |
urls-archive.max.fan-twitter-@nytrealestate-filtered.txt-shallow-20200710-211550-e9nz2-00001.warc.os.cdx.gz | 797060 | download |
urls-archive.max.fan-twitter-@nytrealestate-filtered.txt-shallow-20200710-211550-e9nz2-meta.warc.gz | 2116804 | download job |
urls-archive.max.fan-twitter-@nytrealestate-filtered.txt-shallow-20200710-211550-e9nz2-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@nytrealestate-filtered.txt-shallow-20200710-211550-e9nz2-urls.txt | 2030981 | download |
urls-archive.max.fan-twitter-@nytrealestate-filtered.txt-shallow-20200710-211550-e9nz2.json | 341 | download job |
urls-archive.max.fan-twitter-@rccampuspolice-filtered.txt-shallow-20200711-024447-a4sly-00000.warc.gz | 117082317 | download job |
urls-archive.max.fan-twitter-@rccampuspolice-filtered.txt-shallow-20200711-024447-a4sly-00000.warc.os.cdx.gz | 125664 | download |
urls-archive.max.fan-twitter-@rccampuspolice-filtered.txt-shallow-20200711-024447-a4sly-urls.txt | 61179 | download |
urls-archive.max.fan-twitter-@rconnollyHPD46-filtered.txt-shallow-20200711-024447-51nv6-00000.warc.gz | 53368938 | download job |
urls-archive.max.fan-twitter-@rconnollyHPD46-filtered.txt-shallow-20200711-024447-51nv6-00000.warc.os.cdx.gz | 42571 | download |
urls-archive.max.fan-twitter-@templetonpolice-filtered.txt-shallow-20200711-013419-901fi-00000.warc.gz | 25068083 | download job |
urls-archive.max.fan-twitter-@templetonpolice-filtered.txt-shallow-20200711-013419-901fi-00000.warc.os.cdx.gz | 34205 | download |
urls-archive.max.fan-twitter-@templetonpolice-filtered.txt-shallow-20200711-013419-901fi-meta.warc.gz | 22889 | download job |
urls-archive.max.fan-twitter-@templetonpolice-filtered.txt-shallow-20200711-013419-901fi-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@templetonpolice-filtered.txt-shallow-20200711-013419-901fi-urls.txt | 24327 | download |
urls-archive.max.fan-twitter-@templetonpolice-filtered.txt-shallow-20200711-013419-901fi.json | 345 | download job |
urls-archive.max.fan-twitter-@tisburypolice-filtered.txt-shallow-20200711-012849-dzuse-00000.warc.gz | 45240697 | download job |
urls-archive.max.fan-twitter-@tisburypolice-filtered.txt-shallow-20200711-012849-dzuse-00000.warc.os.cdx.gz | 50782 | download |
urls-archive.max.fan-twitter-@tisburypolice-filtered.txt-shallow-20200711-012849-dzuse-meta.warc.gz | 31747 | download job |
urls-archive.max.fan-twitter-@tisburypolice-filtered.txt-shallow-20200711-012849-dzuse-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@tisburypolice-filtered.txt-shallow-20200711-012849-dzuse-urls.txt | 31193 | download |
urls-archive.max.fan-twitter-@tisburypolice-filtered.txt-shallow-20200711-012849-dzuse.json | 341 | download job |
urls-archive.max.fan-twitter-@wenhampolice-filtered.txt-shallow-20200711-011921-eauss-00000.warc.gz | 15942618 | download job |
urls-archive.max.fan-twitter-@wenhampolice-filtered.txt-shallow-20200711-011921-eauss-00000.warc.os.cdx.gz | 24656 | download |
urls-archive.max.fan-twitter-@wenhampolice-filtered.txt-shallow-20200711-011921-eauss-meta.warc.gz | 17806 | download job |
urls-archive.max.fan-twitter-@wenhampolice-filtered.txt-shallow-20200711-011921-eauss-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@wenhampolice-filtered.txt-shallow-20200711-011921-eauss-urls.txt | 8947 | download |
urls-archive.max.fan-twitter-@wenhampolice-filtered.txt-shallow-20200711-011921-eauss.json | 339 | download job |
urls-archive.max.fan-twitter-@wilbrahampolice-filtered.txt-shallow-20200711-011439-41ttb-00000.warc.gz | 122496568 | download job |
urls-archive.max.fan-twitter-@wilbrahampolice-filtered.txt-shallow-20200711-011439-41ttb-00000.warc.os.cdx.gz | 136373 | download |
urls-archive.max.fan-twitter-@wilbrahampolice-filtered.txt-shallow-20200711-011439-41ttb-meta.warc.gz | 75969 | download job |
urls-archive.max.fan-twitter-@wilbrahampolice-filtered.txt-shallow-20200711-011439-41ttb-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@wilbrahampolice-filtered.txt-shallow-20200711-011439-41ttb-urls.txt | 124705 | download |
urls-archive.max.fan-twitter-@wilbrahampolice-filtered.txt-shallow-20200711-011439-41ttb.json | 345 | download job |
urls-archive.max.fan-twitter-@yarmouthpolice-filtered.txt-shallow-20200711-005241-1fxej-00000.warc.gz | 462838820 | download job |
urls-archive.max.fan-twitter-@yarmouthpolice-filtered.txt-shallow-20200711-005241-1fxej-00000.warc.os.cdx.gz | 555172 | download |
urls-archive.max.fan-twitter-@yarmouthpolice-filtered.txt-shallow-20200711-005241-1fxej-meta.warc.gz | 295382 | download job |
urls-archive.max.fan-twitter-@yarmouthpolice-filtered.txt-shallow-20200711-005241-1fxej-meta.warc.os.cdx.gz | 47 | download |
urls-archive.max.fan-twitter-@yarmouthpolice-filtered.txt-shallow-20200711-005241-1fxej-urls.txt | 448600 | download |
urls-archive.max.fan-twitter-@yarmouthpolice-filtered.txt-shallow-20200711-005241-1fxej.json | 343 | download job |
urls-transfer.notkiska.pw-facebook-@fieldcraftsurvival-shallow-20200710-225005-as74e-00001.warc.gz | 5381668396 | download job |
urls-transfer.notkiska.pw-facebook-@fieldcraftsurvival-shallow-20200710-225005-as74e-00001.warc.os.cdx.gz | 625340 | download |
urls-transfer.notkiska.pw-facebook-@fieldcraftsurvival-shallow-20200710-225005-as74e-00002.warc.gz | 445927842 | download job |
urls-transfer.notkiska.pw-facebook-@fieldcraftsurvival-shallow-20200710-225005-as74e-00002.warc.os.cdx.gz | 300633 | download |
urls-transfer.notkiska.pw-facebook-@fieldcraftsurvival-shallow-20200710-225005-as74e-meta.warc.gz | 792598 | download job |
urls-transfer.notkiska.pw-facebook-@fieldcraftsurvival-shallow-20200710-225005-as74e-meta.warc.os.cdx.gz | 47 | download |
urls-transfer.notkiska.pw-facebook-@fieldcraftsurvival-shallow-20200710-225005-as74e-urls.txt | 210114 | download |
urls-transfer.notkiska.pw-facebook-@fieldcraftsurvival-shallow-20200710-225005-as74e.json | 350 | download job |
urls-transfer.notkiska.pw-twitter-%23notmypresident-shallow-20200530-220957-2c0z0-00106.warc.gz | 5369544029 | download job |
urls-transfer.notkiska.pw-twitter-%23notmypresident-shallow-20200530-220957-2c0z0-00106.warc.os.cdx.gz | 501162 | download |
urls-transfer.notkiska.pw-twitter-@fieldcrafttweet-shallow-20200710-224418-2rklm-00000.warc.gz | 5463549412 | download job |
urls-transfer.notkiska.pw-twitter-@fieldcrafttweet-shallow-20200710-224418-2rklm-00000.warc.os.cdx.gz | 163792 | download |
urls-transfer.notkiska.pw-vote-usa_org-twitter-accounts-outlinks.1.txt-shallow-20200609-230435-7k4tj-00070.warc.gz | 5392372211 | download job |
urls-transfer.notkiska.pw-vote-usa_org-twitter-accounts-outlinks.1.txt-shallow-20200609-230435-7k4tj-00070.warc.os.cdx.gz | 1163469 | download |
windowx.tistory.com-inf-20200711-014001-elvij-00000.warc.gz | 79799675 | download job |
windowx.tistory.com-inf-20200711-014001-elvij-00000.warc.os.cdx.gz | 159286 | download |
windowx.tistory.com-inf-20200711-014001-elvij-meta.warc.gz | 103097 | download job |
windowx.tistory.com-inf-20200711-014001-elvij-meta.warc.os.cdx.gz | 47 | download |
windowx.tistory.com-inf-20200711-014001-elvij.json | 253 | download job |
www.12371.cn-inf-20200709-194054-1lotk-00008.warc.gz | 5368791348 | download job |
www.12371.cn-inf-20200709-194054-1lotk-00008.warc.os.cdx.gz | 3408522 | download |
www.boomerangfu.com-inf-20200710-233441-7k64i.json | 243 | download job |
www.mathway.com-inf-20200610-011458-6sruz-00020.warc.gz | 5368731684 | download job |
www.mathway.com-inf-20200610-011458-6sruz-00020.warc.os.cdx.gz | 21213600 | download |
www.raspberrypi.org-inf-20200707-192424-bv6p7-00023.warc.gz | 5368838040 | download job |
www.raspberrypi.org-inf-20200707-192424-bv6p7-00023.warc.os.cdx.gz | 3009024 | download |
www.swtor.com-inf-20200224-042317-1qahy-00153.warc.gz | 5368956018 | download job |
www.swtor.com-inf-20200224-042317-1qahy-00153.warc.os.cdx.gz | 1422318 | download |
www.taringa.net-inf-20190927-205127-2a0h7-00698.warc.gz | 5368778159 | download job |
www.taringa.net-inf-20190927-205127-2a0h7-00698.warc.os.cdx.gz | 3203980 | download |