From da0624f40eefbb2d15a222ba501c058fc5a49dfc Mon Sep 17 00:00:00 2001 From: libertysoft3 <31760410+libertysoft3@users.noreply.github.com> Date: Tue, 30 Jun 2020 03:24:20 -0700 Subject: [PATCH] Update README.md --- README.md | 24 ++++++++++++------------ 1 file changed, 12 insertions(+), 12 deletions(-) diff --git a/README.md b/README.md index e6ecae7..92dce99 100644 --- a/README.md +++ b/README.md @@ -6,26 +6,26 @@ pulls reddit data from the [pushshift](https://github.com/pushshift/api) api and requires python 3 on linux, OSX, or Windows - sudo apt-get install pip - pip install psaw - git clone https://github.com/chid/snudown - cd snudown - sudo python setup.py install - cd .. - git clone [this repo] - cd reddit-html-archiver - chmod u+x *.py + $ sudo apt-get install pip + $ pip install psaw + $ git clone https://github.com/chid/snudown + $ cd snudown + $ sudo python setup.py install + $ cd .. + $ git clone [this repo] + $ cd reddit-html-archiver + $ chmod u+x *.py Windows users may need to run - chcp 65001 - set PYTHONIOENCODING=utf-8 + > chcp 65001 + > set PYTHONIOENCODING=utf-8 before running `fetch_links.py` or `write_html.py` to resolve encoding errors such as 'codec can't encode character'. ### fetch reddit data -data is fetched by subreddit and date range and is stored as csv files in `data`. You may need to explicitly run the script python3 if it is not the default on your system. +data is fetched by subreddit and date range and is stored as csv files in `data`. You may need to explicitly run the script with python3 if it is not the default on your system. $ python3 ./fetch_links.py politics 2017-1-1 2017-2-1 # or add some link/post filtering to download less data