.gitignore
.pre-commit-config.yaml
LICENSE
MANIFEST.in
Pipfile
Pipfile.lock
README.md
setup.cfg
setup.py
test.py
.github/workflows/continuous-deployment.yaml
.github/workflows/docs.yaml
_notebooks/compare.ipynb
_notebooks/label.ipynb
_notebooks/sample.ipynb
_notebooks/train.ipynb
_notebooks/input/labeled.csv
_notebooks/input/sample.csv
_notebooks/input/20220730-sample/100reporters.hyperlinks.json
_notebooks/input/20220730-sample/11alivenews.hyperlinks.json
_notebooks/input/20220730-sample/12khari.hyperlinks.json
_notebooks/input/20220730-sample/12newsnow.hyperlinks.json
_notebooks/input/20220730-sample/13wmaznews.hyperlinks.json
_notebooks/input/20220730-sample/14eastmag.hyperlinks.json
_notebooks/input/20220730-sample/19thnews.hyperlinks.json
_notebooks/input/20220730-sample/20minutes.hyperlinks.json
_notebooks/input/20220730-sample/41nbc.hyperlinks.json
_notebooks/input/20220730-sample/6abc.hyperlinks.json
_notebooks/input/20220730-sample/9to5mac.hyperlinks.json
_notebooks/input/20220730-sample/abc.hyperlinks.json
_notebooks/input/20220730-sample/abc15.hyperlinks.json
_notebooks/input/20220730-sample/abc7.hyperlinks.json
_notebooks/input/20220730-sample/abqjournal.hyperlinks.json
_notebooks/input/20220730-sample/aftenposten.hyperlinks.json
_notebooks/input/20220730-sample/ajenglish.hyperlinks.json
_notebooks/input/20220730-sample/albany_herald.hyperlinks.json
_notebooks/input/20220730-sample/aldiadallas.hyperlinks.json
_notebooks/input/20220730-sample/alternet.hyperlinks.json
_notebooks/input/20220730-sample/amestribnews.hyperlinks.json
_notebooks/input/20220730-sample/annapurna_post.hyperlinks.json
_notebooks/input/20220730-sample/ap.hyperlinks.json
_notebooks/input/20220730-sample/appalachia100.hyperlinks.json
_notebooks/input/20220730-sample/arizcir.hyperlinks.json
_notebooks/input/20220730-sample/arknewsorg.hyperlinks.json
_notebooks/input/20220730-sample/ashlandornews.hyperlinks.json
_notebooks/input/20220730-sample/aspenjournalism.hyperlinks.json
_notebooks/input/20220730-sample/austinchronicle.hyperlinks.json
_notebooks/input/20220730-sample/austinvida.hyperlinks.json
_notebooks/input/20220730-sample/avlwatchdog.hyperlinks.json
_notebooks/input/20220730-sample/bakersfieldcali.hyperlinks.json
_notebooks/input/20220730-sample/baltbizonline.hyperlinks.json
_notebooks/input/20220730-sample/baltimorebanner.hyperlinks.json
_notebooks/input/20220730-sample/baltimorebrew.hyperlinks.json
_notebooks/input/20220730-sample/baltimoremag.hyperlinks.json
_notebooks/input/20220730-sample/beltel.hyperlinks.json
_notebooks/input/20220730-sample/berkeleyside.hyperlinks.json
_notebooks/input/20220730-sample/berkshireeagle.hyperlinks.json
_notebooks/input/20220730-sample/bettergov.hyperlinks.json
_notebooks/input/20220730-sample/bfmtv.hyperlinks.json
_notebooks/input/20220730-sample/bhamwatch.hyperlinks.json
_notebooks/input/20220730-sample/binjreports.hyperlinks.json
_notebooks/input/20220730-sample/blackbygodwv.hyperlinks.json
_notebooks/input/20220730-sample/blaw.hyperlinks.json
_notebooks/input/20220730-sample/bleacherreport.hyperlinks.json
_notebooks/input/20220730-sample/bleepincomputer.hyperlinks.json
_notebooks/input/20220730-sample/blockclubchi.hyperlinks.json
_notebooks/input/20220730-sample/bmtenterprise.hyperlinks.json
_notebooks/input/20220730-sample/boingboing.hyperlinks.json
_notebooks/input/20220730-sample/bonginoreport.hyperlinks.json
_notebooks/input/20220730-sample/bostonglobe.hyperlinks.json
_notebooks/input/20220730-sample/bostonherald.hyperlinks.json
_notebooks/input/20220730-sample/brecktexan.hyperlinks.json
_notebooks/input/20220730-sample/breitbartnews.hyperlinks.json
_notebooks/input/20220730-sample/brunswick_news.hyperlinks.json
_notebooks/input/20220730-sample/buckscoherald.hyperlinks.json
_notebooks/input/20220730-sample/bulwarkonline.hyperlinks.json
_notebooks/input/20220730-sample/buzzfeednews.hyperlinks.json
_notebooks/input/20220730-sample/calmatters.hyperlinks.json
_notebooks/input/20220730-sample/capitalb_atl.hyperlinks.json
_notebooks/input/20220730-sample/capitolnewsil.hyperlinks.json
_notebooks/input/20220730-sample/cbs7news.hyperlinks.json
_notebooks/input/20220730-sample/cbsnews.hyperlinks.json
_notebooks/input/20220730-sample/chalkbeat.hyperlinks.json
_notebooks/input/20220730-sample/chequeado.hyperlinks.json
_notebooks/input/20220730-sample/chesbayjournal.hyperlinks.json
_notebooks/input/20220730-sample/chessbase.hyperlinks.json
_notebooks/input/20220730-sample/chicago_reader.hyperlinks.json
_notebooks/input/20220730-sample/chicagoreporter.hyperlinks.json
_notebooks/input/20220730-sample/ciceronoticias.hyperlinks.json
_notebooks/input/20220730-sample/civilbeat.hyperlinks.json
_notebooks/input/20220730-sample/cjr.hyperlinks.json
_notebooks/input/20220730-sample/claytoncrescent.hyperlinks.json
_notebooks/input/20220730-sample/climatecentral.hyperlinks.json
_notebooks/input/20220730-sample/cnet.hyperlinks.json
_notebooks/input/20220730-sample/cnsmd.hyperlinks.json
_notebooks/input/20220730-sample/codaily.hyperlinks.json
_notebooks/input/20220730-sample/coindesk.hyperlinks.json
_notebooks/input/20220730-sample/comissourian.hyperlinks.json
_notebooks/input/20220730-sample/cookpolitical.hyperlinks.json
_notebooks/input/20220730-sample/cpublicpress.hyperlinks.json
_notebooks/input/20220730-sample/cqnow.hyperlinks.json
_notebooks/input/20220730-sample/crucessunnews.hyperlinks.json
_notebooks/input/20220730-sample/dagsavisen.hyperlinks.json
_notebooks/input/20220730-sample/daily_record.hyperlinks.json
_notebooks/input/20220730-sample/dailycaller.hyperlinks.json
_notebooks/input/20220730-sample/dainikbhaskar.hyperlinks.json
_notebooks/input/20220730-sample/dallasbiznews.hyperlinks.json
_notebooks/input/20220730-sample/deadline.hyperlinks.json
_notebooks/input/20220730-sample/deadspin.hyperlinks.json
_notebooks/input/20220730-sample/decisiondeskhq.hyperlinks.json
_notebooks/input/20220730-sample/defectormedia.hyperlinks.json
_notebooks/input/20220730-sample/delawarepublic.hyperlinks.json
_notebooks/input/20220730-sample/desert_oracle.hyperlinks.json
_notebooks/input/20220730-sample/detroitnews.hyperlinks.json
_notebooks/input/20220730-sample/discovermag.hyperlinks.json
_notebooks/input/20220730-sample/discovery.hyperlinks.json
_notebooks/input/20220730-sample/dmregister.hyperlinks.json
_notebooks/input/20220730-sample/dn_no.hyperlinks.json
_notebooks/input/20220730-sample/drudge.hyperlinks.json
_notebooks/input/20220730-sample/eastbaytimes.hyperlinks.json
_notebooks/input/20220730-sample/edsource.hyperlinks.json
_notebooks/input/20220730-sample/eenewsupdates.hyperlinks.json
_notebooks/input/20220730-sample/el_universal_mx.hyperlinks.json
_notebooks/input/20220730-sample/eltiempo.hyperlinks.json
_notebooks/input/20220730-sample/eveningstandard.hyperlinks.json
_notebooks/input/20220730-sample/evroundtable.hyperlinks.json
_notebooks/input/20220730-sample/expressnews.hyperlinks.json
_notebooks/input/20220730-sample/fairmediawatch.hyperlinks.json
_notebooks/input/20220730-sample/fdrlst.hyperlinks.json
_notebooks/input/20220730-sample/fivethirtyeight.hyperlinks.json
_notebooks/input/20220730-sample/flintbeat.hyperlinks.json
_notebooks/input/20220730-sample/florida_bulldog.hyperlinks.json
_notebooks/input/20220730-sample/flphoenixnews.hyperlinks.json
_notebooks/input/20220730-sample/foreignpolicy.hyperlinks.json
_notebooks/input/20220730-sample/fortunemagazine.hyperlinks.json
_notebooks/input/20220730-sample/fortworthreport.hyperlinks.json
_notebooks/input/20220730-sample/fox29philly.hyperlinks.json
_notebooks/input/20220730-sample/fox5atlanta.hyperlinks.json
_notebooks/input/20220730-sample/foxla.hyperlinks.json
_notebooks/input/20220730-sample/foxsports.hyperlinks.json
_notebooks/input/20220730-sample/france24.hyperlinks.json
_notebooks/input/20220730-sample/france24_en.hyperlinks.json
_notebooks/input/20220730-sample/freebeacon.hyperlinks.json
_notebooks/input/20220730-sample/gainesvillesun.hyperlinks.json
_notebooks/input/20220730-sample/gcm_nf.hyperlinks.json
_notebooks/input/20220730-sample/gothamist.hyperlinks.json
_notebooks/input/20220730-sample/gwinnettdaily.hyperlinks.json
_notebooks/input/20220730-sample/harpers.hyperlinks.json
_notebooks/input/20220730-sample/hellgateny.hyperlinks.json
_notebooks/input/20220730-sample/hiddencityphila.hyperlinks.json
_notebooks/input/20220730-sample/houstonchron.hyperlinks.json
_notebooks/input/20220730-sample/hromadskeua.hyperlinks.json
_notebooks/input/20220730-sample/hyperlinks.zip
_notebooks/input/20220731-sample/nhpr.hyperlinks.json
_notebooks/input/20220731-sample/nikkei.hyperlinks.json
_notebooks/input/20220731-sample/novayagazeta_eu.hyperlinks.json
_notebooks/input/20220731-sample/ntdaily.hyperlinks.json
_notebooks/input/20220731-sample/nybooks.hyperlinks.json
_notebooks/input/20220731-sample/nysfocus.hyperlinks.json
_notebooks/input/20220731-sample/nytimes.hyperlinks.json
_notebooks/input/20220731-sample/objectivejrn.hyperlinks.json
_notebooks/input/20220731-sample/occrp.hyperlinks.json
_notebooks/input/20220731-sample/ocregister.hyperlinks.json
_notebooks/input/20220731-sample/okayplayer.hyperlinks.json
_notebooks/input/20220731-sample/onlineathens.hyperlinks.json
_notebooks/input/20220731-sample/oronline.hyperlinks.json
_notebooks/input/20220731-sample/osnepalnews.hyperlinks.json
_notebooks/input/20220731-sample/ottawacitizen.hyperlinks.json
_notebooks/input/20220731-sample/parisreview.hyperlinks.json
_notebooks/input/20220731-sample/people.hyperlinks.json
_notebooks/input/20220731-sample/pitchfork.hyperlinks.json
_notebooks/input/20220731-sample/pittsburghpg.hyperlinks.json
_notebooks/input/20220731-sample/platformer.hyperlinks.json
_notebooks/input/20220731-sample/politico.hyperlinks.json
_notebooks/input/20220731-sample/portlandmercury.hyperlinks.json
_notebooks/input/20220731-sample/postandcourier.hyperlinks.json
_notebooks/input/20220731-sample/powerlineus.hyperlinks.json
_notebooks/input/20220731-sample/prabhatkhabar.hyperlinks.json
_notebooks/input/20220731-sample/prensagrafica.hyperlinks.json
_notebooks/input/20220731-sample/pressenterprise.hyperlinks.json
_notebooks/input/20220731-sample/prismreports.hyperlinks.json
_notebooks/input/20220731-sample/propublica.hyperlinks.json
_notebooks/input/20220731-sample/protocol.hyperlinks.json
_notebooks/input/20220731-sample/publicintegrity.hyperlinks.json
_notebooks/input/20220731-sample/punjabkesari.hyperlinks.json
_notebooks/input/20220731-sample/qctimes.hyperlinks.json
_notebooks/input/20220731-sample/quintoelab.hyperlinks.json
_notebooks/input/20220731-sample/qz.hyperlinks.json
_notebooks/input/20220731-sample/reason.hyperlinks.json
_notebooks/input/20220731-sample/restofworld.hyperlinks.json
_notebooks/input/20220731-sample/reveal.hyperlinks.json
_notebooks/input/20220731-sample/reviewjournal.hyperlinks.json
_notebooks/input/20220731-sample/rgvfox.hyperlinks.json
_notebooks/input/20220731-sample/rianru.hyperlinks.json
_notebooks/input/20220731-sample/ringer.hyperlinks.json
_notebooks/input/20220731-sample/rollcall.hyperlinks.json
_notebooks/input/20220731-sample/romenewstribune.hyperlinks.json
_notebooks/input/20220731-sample/rpbreakingnews.hyperlinks.json
_notebooks/input/20220731-sample/rt_com.hyperlinks.json
_notebooks/input/20220731-sample/rtenews.hyperlinks.json
_notebooks/input/20220731-sample/sacbee_news.hyperlinks.json
_notebooks/input/20220731-sample/salon.hyperlinks.json
_notebooks/input/20220731-sample/scalawagmag.hyperlinks.json
_notebooks/input/20220731-sample/scsentinel.hyperlinks.json
_notebooks/input/20220731-sample/sdut.hyperlinks.json
_notebooks/input/20220731-sample/seattletimes.hyperlinks.json
_notebooks/input/20220731-sample/segodnya_online.hyperlinks.json
_notebooks/input/20220731-sample/seikyoofficial.hyperlinks.json
_notebooks/input/20220731-sample/semafor.hyperlinks.json
_notebooks/input/20220731-sample/setopati.hyperlinks.json
_notebooks/input/20220731-sample/sfchronicle.hyperlinks.json
_notebooks/input/20220731-sample/sgfcitizen.hyperlinks.json
_notebooks/input/20220731-sample/sltrib.hyperlinks.json
_notebooks/input/20220731-sample/sludge.hyperlinks.json
_notebooks/input/20220731-sample/source_nm.hyperlinks.json
_notebooks/input/20220731-sample/statesman.hyperlinks.json
_notebooks/input/20220731-sample/statnews.hyperlinks.json
_notebooks/input/20220731-sample/sternde.hyperlinks.json
_notebooks/input/20220731-sample/stlpublicradio.hyperlinks.json
_notebooks/input/20220731-sample/stltoday.hyperlinks.json
_notebooks/input/20220731-sample/strikewave.hyperlinks.json
_notebooks/input/20220731-sample/tass_agency.hyperlinks.json
_notebooks/input/20220731-sample/tb_times.hyperlinks.json
_notebooks/input/20220731-sample/teamtrace.hyperlinks.json
_notebooks/input/20220731-sample/techcrunch.hyperlinks.json
_notebooks/input/20220731-sample/techmeme.hyperlinks.json
_notebooks/input/20220731-sample/techreview.hyperlinks.json
_notebooks/input/20220731-sample/telegraphga.hyperlinks.json
_notebooks/input/20220731-sample/theappeal.hyperlinks.json
_notebooks/input/20220731-sample/thebafflermag.hyperlinks.json
_notebooks/input/20220731-sample/theblaze.hyperlinks.json
_notebooks/input/20220731-sample/thedailybeast.hyperlinks.json
_notebooks/input/20220731-sample/thedbk.hyperlinks.json
_notebooks/input/20220731-sample/thedispatch.hyperlinks.json
_notebooks/input/20220731-sample/thehill.hyperlinks.json
_notebooks/input/20220731-sample/thehilltimes.hyperlinks.json
_notebooks/input/20220731-sample/theinformation.hyperlinks.json
_notebooks/input/20220731-sample/theintercept.hyperlinks.json
_notebooks/input/20220731-sample/thejournal_ie.hyperlinks.json
_notebooks/input/20220731-sample/thelasentinel.hyperlinks.json
_notebooks/input/20220731-sample/thelensnola.hyperlinks.json
_notebooks/input/20220731-sample/themarkup.hyperlinks.json
_notebooks/input/20220731-sample/theobserver.hyperlinks.json
_notebooks/input/20220731-sample/thephilacitizen.hyperlinks.json
_notebooks/input/20220731-sample/thetorontosun.hyperlinks.json
_notebooks/input/20220731-sample/timesenterprise.hyperlinks.json
_notebooks/input/20220731-sample/timesofindia.hyperlinks.json
_notebooks/input/20220731-sample/torontostar.hyperlinks.json
_notebooks/input/20220731-sample/torrentfreak.hyperlinks.json
_notebooks/input/20220731-sample/townhallcom.hyperlinks.json
_notebooks/input/20220731-sample/tpm.hyperlinks.json
_notebooks/input/20220731-sample/truthout.hyperlinks.json
_notebooks/input/20220731-sample/ukrinform.hyperlinks.json
_notebooks/input/20220731-sample/unichicago.hyperlinks.json
_notebooks/input/20220731-sample/usweekly.hyperlinks.json
_notebooks/input/20220731-sample/uwogazette.hyperlinks.json
_notebooks/input/20220731-sample/vancouversun.hyperlinks.json
_notebooks/input/20220731-sample/vcstar.hyperlinks.json
_notebooks/input/20220731-sample/verge.hyperlinks.json
_notebooks/input/20220731-sample/vgnett.hyperlinks.json
_notebooks/input/20220731-sample/voguemagazine.hyperlinks.json
_notebooks/input/20220731-sample/voiceofoc.hyperlinks.json
_notebooks/input/20220731-sample/voiceofsandiego.hyperlinks.json
_notebooks/input/20220731-sample/voicesofbay.hyperlinks.json
_notebooks/input/20220731-sample/voxdotcom.hyperlinks.json
_notebooks/input/20220731-sample/vtdigger.hyperlinks.json
_notebooks/input/20220731-sample/wabenews.hyperlinks.json
_notebooks/input/20220731-sample/washingtonpost.hyperlinks.json
_notebooks/input/20220731-sample/wausauherald.hyperlinks.json
_notebooks/input/20220731-sample/wcfcourier.hyperlinks.json
_notebooks/input/20220731-sample/weatherchannel.hyperlinks.json
_notebooks/input/20220731-sample/wfaa.hyperlinks.json
_notebooks/input/20220731-sample/windowscentral.hyperlinks.json
_notebooks/input/20220731-sample/wired.hyperlinks.json
_notebooks/input/20220731-sample/worldnetdaily.hyperlinks.json
_notebooks/input/20220731-sample/wplglocal10.hyperlinks.json
_notebooks/input/20220731-sample/wral.hyperlinks.json
_notebooks/input/20220731-sample/wrblnews3.hyperlinks.json
_notebooks/input/20220731-sample/wsbtv.hyperlinks.json
_notebooks/input/20220731-sample/wsj.hyperlinks.json
_notebooks/input/20220731-sample/wttw.hyperlinks.json
_notebooks/input/20220731-sample/yorkdispatch.hyperlinks.json
_notebooks/input/20220731-sample/zeitonline.hyperlinks.json
_notebooks/input/20220731-sample/zerohedge.hyperlinks.json
_notebooks/input/20220731-sample/zn_ua.hyperlinks.json
_notebooks/output/path-and-text-model.pickle
_notebooks/output/path-only-model.pickle
_notebooks/output/wrong.csv
docs/Makefile
docs/Untitled File
docs/conf.py
docs/index.md
docs/make.bat
docs/requirements.txt
docs/_static/css/custom.css
docs/_templates/nav.html
storysniffer/__init__.py
storysniffer/path-and-text-model.pickle
storysniffer/path-only-model.pickle
storysniffer.egg-info/PKG-INFO
storysniffer.egg-info/SOURCES.txt
storysniffer.egg-info/dependency_links.txt
storysniffer.egg-info/requires.txt
storysniffer.egg-info/top_level.txt