timesearch/timesearch_modules/__init__.py

import argparse
import sys

from . import exceptions

# NOTE: Originally I wanted the docstring for each module to be within their
# file. However, this means that composing the global helptext would require
# importing those modules, which will subsequently import PRAW and a whole lot
# of other things. This made TS very slow to load which is okay when you're
# actually using it but really terrible when you're just viewing the help text.
#
# DOCSTRING is the global help template. Every {command} placeholder below is
# filled in later in this file with str.format, using the indented first
# paragraph of that command's entry in MODULE_DOCSTRINGS, so each placeholder
# name must be a key of MODULE_DOCSTRINGS.
DOCSTRING = '''
Timesearch
The subreddit archiver

The basics:
1. Collect a subreddit's submissions
    > timesearch.py timesearch -r subredditname

2. Collect the comments for those submissions
    > timesearch.py commentaugment -r subredditname

3. Stay up-to-date
    > timesearch.py livestream -r subredditname


Commands for collecting:
{timesearch}
{commentaugment}
{livestream}
{getstyles}
{getwiki}

Commands for processing:
{offline_reading}
{redmash}
{breakdown}
{mergedb}

TO SEE DETAILS ON EACH COMMAND, RUN
> timesearch.py <command>
'''

# Full help text for each command, keyed by the command name that main()
# receives as its first argument. The first paragraph of each entry (everything
# before the first blank line) doubles as the short summary substituted into
# the global DOCSTRING template.
# The flag spellings shown here must match the argparse definitions further
# down in this file; the long form of -u is --user.
MODULE_DOCSTRINGS = {
    'breakdown': '''
breakdown:
    Give the comment / submission counts for users in a subreddit, or
    the subreddits that a user posts to.

    Automatically dumps into a <database>_breakdown.json file
    in the same directory as the database.

    > timesearch.py breakdown -r subredditname <flags>
    > timesearch.py breakdown -u username <flags>

    flags:
    -r "test" | --subreddit "test":
        The subreddit database to break down.

    -u "test" | --user "test":
        The username database to break down.

    --sort "name" | "submissions" | "comments" | "total_posts"
        Sort the output.
''',

    'commentaugment': '''
commentaugment:
    Collect comments on a subreddit or comments made by a user.

    > timesearch.py commentaugment -r subredditname <flags>
    > timesearch.py commentaugment -u username <flags>

    flags:
    -s "t3_xxxxxx" | --specific "t3_xxxxxx":
        Given a submission ID, t3_xxxxxx, scan only that submission.

    -l "update" | --lower "update":
        If a number - the unix timestamp to start at.
        If "update" - continue from latest comment in db.
        Default: update

    -up 1467460221 | --upper 1467460221:
        If a number - the unix timestamp to stop at.
        If not provided - stop at current time.
        Default: current time

    --dont_supplement:
        If provided, trust the pushshift data and do not fetch live copies
        from reddit.

    -v | --verbose:
        If provided, print extra information to the screen.
''',

    'getstyles': '''
getstyles:
    Collect the stylesheet, and css images.

    > timesearch.py getstyles -r subredditname
''',

    'getwiki': '''
getwiki:
    Collect all available wiki pages.

    > timesearch.py getwiki -r subredditname
''',

    'mergedb': '''
mergedb:
    Copy all new posts from one timesearch database into another.

    > timesearch mergedb --from redditdev1.db --to redditdev2.db

    flags:
    --from:
        The database file containing the posts you wish to copy.

    --to:
        The database file to which you will copy the posts.
        The database is modified in-place.
        Existing posts will be ignored and not updated.
''',

    'livestream': '''
livestream:
    Continuously collect submissions and/or comments.

    > timesearch.py livestream -r subredditname <flags>
    > timesearch.py livestream -u username <flags>

    flags:
    -r "test" | --subreddit "test":
        The subreddit to collect from.

    -u "test" | --user "test":
        The redditor to collect from.

    -s | --submissions:
        If provided, do collect submissions. Otherwise don't.

    -c | --comments:
        If provided, do collect comments. Otherwise don't.

    If submissions and comments are BOTH left unspecified, then they will
    BOTH be collected.

    -v | --verbose:
        If provided, print extra information to the screen.

    -w 30 | --wait 30:
        The number of seconds to wait between cycles.

    -1 | --once:
        If provided, only do a single loop. Otherwise go forever.
''',

    'offline_reading': '''
offline_reading:
    Render submissions and comment threads to HTML via Markdown.

    > timesearch.py offline_reading -r subredditname <flags>
    > timesearch.py offline_reading -u username <flags>

    flags:
    -s "t3_xxxxxx" | --specific "t3_xxxxxx":
        Given a submission ID, t3_xxxxxx, render only that submission.
        Otherwise render every submission in the database.
''',

    'redmash': '''
redmash:
    Dump submission listings to a plaintext or HTML file.

    > timesearch.py redmash -r subredditname <flags>
    > timesearch.py redmash -u username <flags>

    flags:
    -r "test" | --subreddit "test":
        The subreddit database to dump

    -u "test" | --user "test":
        The username database to dump

    --html:
        Write HTML files instead of plain text.

    --offline:
        The links in the mash will point to the files generated by
        offline_reading. That is, `../offline_reading/fullname.html` instead
        of `http://redd.it/id`. This will NOT trigger offline_reading to
        generate the files now, so you must run that tool separately.

    -st 50 | --score_threshold 50:
        Only mash posts with at least this many points.
        Applies to ALL mashes!

    --all:
        Perform all of the mashes listed below.

    --date:
        Perform a mash sorted by date.

    --title:
        Perform a mash sorted by title.

    --score:
        Perform a mash sorted by score.

    --author:
        For subreddit databases only.
        Perform a mash sorted by author.

    --sub:
        For username databases only.
        Perform a mash sorted by subreddit.

    --flair:
        Perform a mash sorted by flair.

    examples:
        `timesearch redmash -r botwatch --date`
        does only the date file.

        `timesearch redmash -r botwatch --score --title`
        does both the score and title files.

        `timesearch redmash -r botwatch --score --score_threshold 50`
        only shows submissions with >= 50 points.

        `timesearch redmash -r botwatch --all`
        performs all of the different mashes.
''',

    'timesearch': '''
timesearch:
    Collect submissions from the subreddit across all of history, or
    Collect submissions by a user (as many as possible).

    > timesearch.py timesearch -r subredditname <flags>
    > timesearch.py timesearch -u username <flags>

    flags:
    -r "test" | --subreddit "test":
        The subreddit to scan. Mutually exclusive with username.

    -u "test" | --user "test":
        The user to scan. Mutually exclusive with subreddit.

    -l "update" | --lower "update":
        If a number - the unix timestamp to start at.
        If "update" - continue from latest submission in db.
        Default: update

    -up 1467460221 | --upper 1467460221:
        If a number - the unix timestamp to stop at.
        If not provided - stop at current time.
        Default: current time

    --dont_supplement:
        If provided, trust the pushshift data and do not fetch live copies
        from reddit.

    -v | --verbose:
        If provided, print extra information to the screen.
''',
}


def docstring_preview(text):
    '''
    Extract the summary paragraph of a help text: everything that comes
    before the first blank line. If there is no blank line, the whole text
    is returned.
    '''
    summary, _, _ = text.partition('\n\n')
    return summary

def listget(li, index, fallback=None):
    '''
    Return li[index], or fallback when that index raises IndexError.
    '''
    try:
        item = li[index]
    except IndexError:
        item = fallback
    return item

def indent(text, spaces=4):
    '''
    Prefix every non-blank line of text with the given number of spaces.
    Lines that are empty or whitespace-only are left exactly as they are.
    '''
    prefix = ' ' * spaces
    indented = []
    for line in text.split('\n'):
        if line.strip():
            indented.append(prefix + line)
        else:
            indented.append(line)
    return '\n'.join(indented)

# Map each command name to the indented summary paragraph of its help text,
# then substitute those summaries into the global help template.
docstring_headers = dict(
    (command, indent(docstring_preview(helptext)))
    for (command, helptext) in MODULE_DOCSTRINGS.items()
)

DOCSTRING = DOCSTRING.format_map(docstring_headers)

####################################################################################################
####################################################################################################

def breakdown_gateway(args):
    '''
    Import the breakdown module on demand and pass it the parsed arguments.
    '''
    from . import breakdown as command_module
    command_module.breakdown_argparse(args)

def commentaugment_gateway(args):
    '''
    Import the commentaugment module on demand and pass it the parsed
    arguments.
    '''
    from . import commentaugment as command_module
    command_module.commentaugment_argparse(args)

def getstyles_gateway(args):
    '''
    Import the getstyles module on demand and pass it the parsed arguments.
    '''
    from . import getstyles as command_module
    command_module.getstyles_argparse(args)

def getwiki_gateway(args):
    '''
    Import the getwiki module on demand and pass it the parsed arguments.
    '''
    from . import getwiki as command_module
    command_module.getwiki_argparse(args)

def livestream_gateway(args):
    '''
    Import the livestream module on demand and pass it the parsed arguments.
    '''
    from . import livestream as command_module
    command_module.livestream_argparse(args)

def mergedb_gateway(args):
    '''
    Import the mergedb module on demand and pass it the parsed arguments.
    '''
    from . import mergedb as command_module
    command_module.mergedb_argparse(args)

def offline_reading_gateway(args):
    '''
    Import the offline_reading module on demand and pass it the parsed
    arguments.
    '''
    from . import offline_reading as command_module
    command_module.offline_reading_argparse(args)

def redmash_gateway(args):
    '''
    Import the redmash module on demand and pass it the parsed arguments.
    '''
    from . import redmash as command_module
    command_module.redmash_argparse(args)

def timesearch_gateway(args):
    '''
    Import the timesearch module on demand and pass it the parsed arguments.
    '''
    from . import timesearch as command_module
    command_module.timesearch_argparse(args)


# Command-line parser. Every subcommand gets its own subparser whose `func`
# default is the matching gateway function; main() calls args.func(args) after
# parsing, so the heavy command modules are only imported when actually run.
#
# The -u option is registered under both --user and --username. The help text
# in MODULE_DOCSTRINGS has advertised --username, which argparse used to reject
# because only --user was defined. Both spellings store into `username`.
parser = argparse.ArgumentParser()
subparsers = parser.add_subparsers()

p_breakdown = subparsers.add_parser('breakdown')
p_breakdown.add_argument('--sort', dest='sort', default=None)
p_breakdown.add_argument('-r', '--subreddit', dest='subreddit', default=None)
p_breakdown.add_argument('-u', '--user', '--username', dest='username', default=None)
p_breakdown.set_defaults(func=breakdown_gateway)

p_commentaugment = subparsers.add_parser('commentaugment')
p_commentaugment.add_argument('-r', '--subreddit', dest='subreddit', default=None)
p_commentaugment.add_argument('-s', '--specific', dest='specific_submission', default=None)
p_commentaugment.add_argument('-u', '--user', '--username', dest='username', default=None)
p_commentaugment.add_argument('-v', '--verbose', dest='verbose', action='store_true')
# store_false: do_supplement is True unless --dont_supplement is given.
p_commentaugment.add_argument('--dont_supplement', dest='do_supplement', action='store_false')
p_commentaugment.add_argument('-l', '--lower', dest='lower', default='update')
p_commentaugment.add_argument('-up', '--upper', dest='upper', default=None)
p_commentaugment.set_defaults(func=commentaugment_gateway)

p_getstyles = subparsers.add_parser('getstyles')
p_getstyles.add_argument('-r', '--subreddit', dest='subreddit')
p_getstyles.set_defaults(func=getstyles_gateway)

p_getwiki = subparsers.add_parser('getwiki')
p_getwiki.add_argument('-r', '--subreddit', dest='subreddit')
p_getwiki.set_defaults(func=getwiki_gateway)

p_livestream = subparsers.add_parser('livestream')
p_livestream.add_argument('-1', '--once', dest='once', action='store_true')
p_livestream.add_argument('-c', '--comments', dest='comments', action='store_true')
p_livestream.add_argument('-l', '--limit', dest='limit', default=None)
p_livestream.add_argument('-r', '--subreddit', dest='subreddit', default=None)
p_livestream.add_argument('-s', '--submissions', dest='submissions', action='store_true')
p_livestream.add_argument('-u', '--user', '--username', dest='username', default=None)
p_livestream.add_argument('-v', '--verbose', dest='verbose', action='store_true')
p_livestream.add_argument('-w', '--wait', dest='sleepy', default=30)
p_livestream.set_defaults(func=livestream_gateway)

p_mergedb = subparsers.add_parser('mergedb')
p_mergedb.add_argument('--from', dest='from_db_path', required=True)
p_mergedb.add_argument('--to', dest='to_db_path', required=True)
p_mergedb.set_defaults(func=mergedb_gateway)

p_offline_reading = subparsers.add_parser('offline_reading')
p_offline_reading.add_argument('-r', '--subreddit', dest='subreddit', default=None)
p_offline_reading.add_argument('-s', '--specific', dest='specific_submission', default=None)
p_offline_reading.add_argument('-u', '--user', '--username', dest='username', default=None)
p_offline_reading.set_defaults(func=offline_reading_gateway)

p_redmash = subparsers.add_parser('redmash')
p_redmash.add_argument('--all', dest='do_all', action='store_true')
p_redmash.add_argument('--author', dest='do_author', action='store_true')
p_redmash.add_argument('--date', dest='do_date', action='store_true')
p_redmash.add_argument('--flair', dest='do_flair', action='store_true')
p_redmash.add_argument('--html', dest='html', action='store_true')
p_redmash.add_argument('--score', dest='do_score', action='store_true')
p_redmash.add_argument('--sub', dest='do_subreddit', action='store_true')
p_redmash.add_argument('--title', dest='do_title', action='store_true')
p_redmash.add_argument('--offline', dest='offline', action='store_true')
p_redmash.add_argument('-r', '--subreddit', dest='subreddit', default=None)
p_redmash.add_argument('-st', '--score_threshold', dest='score_threshold', default=0)
p_redmash.add_argument('-u', '--user', '--username', dest='username', default=None)
p_redmash.set_defaults(func=redmash_gateway)

p_timesearch = subparsers.add_parser('timesearch')
p_timesearch.add_argument('-l', '--lower', dest='lower', default='update')
p_timesearch.add_argument('-r', '--subreddit', dest='subreddit', default=None)
p_timesearch.add_argument('-u', '--user', '--username', dest='username', default=None)
p_timesearch.add_argument('-up', '--upper', dest='upper', default=None)
p_timesearch.add_argument('-v', '--verbose', dest='verbose', action='store_true')
# store_false: do_supplement is True unless --dont_supplement is given.
p_timesearch.add_argument('--dont_supplement', dest='do_supplement', action='store_false')
p_timesearch.set_defaults(func=timesearch_gateway)

def main(argv):
    '''
    Command-line entry point.

    argv is the list of arguments after the program name, e.g. sys.argv[1:].

    Returns the process exit status: 0 when the chosen command ran to
    completion, 1 when help text was printed instead of running a command or
    when the command raised DatabaseNotFound.
    '''
    helpstrings = {'', 'help', '-h', '--help'}

    command = listget(argv, 0, '').lower()

    # The user did not enter a command, or entered something unrecognized.
    if command not in MODULE_DOCSTRINGS:
        print(DOCSTRING)
        if command == '':
            print('You are seeing the default help text because you did not choose a command.')
        elif command not in helpstrings:
            print('You are seeing the default help text because "%s" was not recognized' % command)
        return 1

    # The user entered a command, but no further arguments, or just help.
    argument = listget(argv, 1, '').lower()
    if argument in helpstrings:
        print(MODULE_DOCSTRINGS[command])
        return 1

    # The command was matched case-insensitively above, but argparse compares
    # subcommand names exactly. Hand it the normalized spelling so that e.g.
    # "TIMESEARCH -r x" runs instead of dying with an "invalid choice" error.
    args = parser.parse_args([command] + list(argv[1:]))
    try:
        args.func(args)
    except exceptions.DatabaseNotFound as e:
        message = str(e)
        message += '\nHave you used any of the other utilities to collect data?'
        print(message)
        return 1

    return 0

# When executed as a script, run main() on the command-line arguments and use
# its return value as the process exit status.
if __name__ == '__main__':
    sys.exit(main(sys.argv[1:]))
Initial migratory commit from voussoir/reddit. 2017-11-14 03:13:19 +00:00			`import argparse`
			`import sys`

			`from . import exceptions`

			`# NOTE: Originally I wanted the docstring for each module to be within their`
			`# file. However, this means that composing the global helptext would require`
			`# importing those modules, which will subsequently import PRAW and a whole lot`
			`# of other things. This made TS very slow to load which is okay when you're`
			`# actually using it but really terrible when you're just viewing the help text.`
			`DOCSTRING = '''`
			`Timesearch`
			`The subreddit archiver`

			`The basics:`
			`1. Collect a subreddit's submissions`
			`> timesearch.py timesearch -r subredditname`

			`2. Collect the comments for those submissions`
			`> timesearch.py commentaugment -r subredditname`

			`3. Stay up-to-date`
			`> timesearch.py livestream -r subredditname`


			`Commands for collecting:`
			`{timesearch}`
			`{commentaugment}`
			`{livestream}`
			`{getstyles}`
			`{getwiki}`

			`Commands for processing:`
			`{offline_reading}`
			`{redmash}`
			`{breakdown}`
			`{mergedb}`

			`TO SEE DETAILS ON EACH COMMAND, RUN`
			`> timesearch.py <command>`
			`'''`

			`MODULE_DOCSTRINGS = {`
			`'breakdown': '''`
			`breakdown:`
			`Give the comment / submission counts for users in a subreddit, or`
			`the subreddits that a user posts to.`

			`Automatically dumps into a <database>_breakdown.json file`
			`in the same directory as the database.`

Add missing <flags> to the breakdown docs. 2018-07-13 07:45:44 +00:00			`> timesearch.py breakdown -r subredditname <flags>`
			`> timesearch.py breakdown -u username <flags>`
Initial migratory commit from voussoir/reddit. 2017-11-14 03:13:19 +00:00
			`flags:`
			`-r "test" \| --subreddit "test":`
			`The subreddit database to break down.`

			`-u "test" \| --username "test":`
			`The username database to break down.`

			`--sort "name" \| "submissions" \| "comments" \| "total_posts"`
			`Sort the output.`
			`''',`

			`'commentaugment': '''`
			`commentaugment:`
Integrate with Pushshift.io to restore timesearch. And improve commentaugment. 2018-04-10 02:53:53 +00:00			`Collect comments on a subreddit or comments made by a user.`
Initial migratory commit from voussoir/reddit. 2017-11-14 03:13:19 +00:00
			`> timesearch.py commentaugment -r subredditname <flags>`
			`> timesearch.py commentaugment -u username <flags>`

			`flags:`
			`-s "t3_xxxxxx" \| --specific "t3_xxxxxx":`
			`Given a submission ID, t3_xxxxxx, scan only that submission.`

Allow commentaugment to take lower and upper as well. 2018-04-21 06:29:42 +00:00			`-l "update" \| --lower "update":`
			`If a number - the unix timestamp to start at.`
			`If "update" - continue from latest comment in db.`
			`Default: update`

			`-up 1467460221 \| --upper 1467460221:`
			`If a number - the unix timestamp to stop at.`
			`If not provided - stop at current time.`
			`Default: current time`

Integrate with Pushshift.io to restore timesearch. And improve commentaugment. 2018-04-10 02:53:53 +00:00			`--dont_supplement:`
			`If provided, trust the pushshift data and do not fetch live copies`
			`from reddit.`

Initial migratory commit from voussoir/reddit. 2017-11-14 03:13:19 +00:00			`-v \| --verbose:`
Integrate with Pushshift.io to restore timesearch. And improve commentaugment. 2018-04-10 02:53:53 +00:00			`If provided, print extra information to the screen.`
Initial migratory commit from voussoir/reddit. 2017-11-14 03:13:19 +00:00			`''',`

			`'getstyles': '''`
			`getstyles:`
			`Collect the stylesheet, and css images.`

			`> timesearch.py getstyles -r subredditname`
			`''',`

			`'getwiki': '''`
			`getwiki:`
			`Collect all available wiki pages.`

			`> timesearch.py getwiki -r subredditname`
			`''',`

			`'mergedb': '''`
			`mergedb:`
			`Copy all new posts from one timesearch database into another.`

			`> timesearch mergedb --from redditdev1.db --to redditdev2.db`

			`flags:`
			`--from:`
			`The database file containing the posts you wish to copy.`

			`--to:`
			`The database file to which you will copy the posts.`
			`The database is modified in-place.`
			`Existing posts will be ignored and not updated.`
			`''',`

			`'livestream': '''`
			`livestream:`
			`Continously collect submissions and/or comments.`

			`> timesearch.py livestream -r subredditname <flags>`
			`> timesearch.py livestream -u username <flags>`

			`flags:`
			`-r "test" \| --subreddit "test":`
			`The subreddit to collect from.`

			`-u "test" \| --username "test":`
			`The redditor to collect from.`

			`-s \| --submissions:`
			`If provided, do collect submissions. Otherwise don't.`

			`-c \| --comments:`
			`If provided, do collect comments. Otherwise don't.`

			`If submissions and comments are BOTH left unspecified, then they will`
			`BOTH be collected.`

			`-v \| --verbose:`
			`If provided, print extra information to the screen.`

			`-w 30 \| --wait 30:`
			`The number of seconds to wait between cycles.`

			`-1 \| --once:`
			`If provided, only do a single loop. Otherwise go forever.`
			`''',`

			`'offline_reading': '''`
			`offline_reading:`
			`Render submissions and comment threads to HTML via Markdown.`

			`> timesearch.py offline_reading -r subredditname <flags>`
			`> timesearch.py offline_reading -u username <flags>`

			`flags:`
			`-s "t3_xxxxxx" \| --specific "t3_xxxxxx":`
			`Given a submission ID, t3_xxxxxx, render only that submission.`
			`Otherwise render every submission in the database.`
			`''',`

			`'redmash': '''`
			`redmash:`
			`Dump submission listings to a plaintext or HTML file.`

			`> timesearch.py redmash -r subredditname <flags>`
			`> timesearch.py redmash -u username <flags>`

			`flags:`
			`-r "test" \| --subreddit "test":`
			`The subreddit database to dump`

			`-u "test" \| --username "test":`
			`The username database to dump`

			`--html:`
			`Write HTML files instead of plain text.`

Add argument --offline to redmash, points to offline_reading files. Previously, the files generated by offline_reading were difficult to use because there was no index file and the filenames are just ids. So now, the redmash can act as an index! 2020-01-06 04:51:31 +00:00			`--offline:`
			`The links in the mash will point to the files generated by`
			offline_reading. That is, `../offline_reading/fullname.html` instead
			of `http://redd.it/id`. This will NOT trigger offline_reading to
			`generate the files now, so you must run that tool separately.`

Initial migratory commit from voussoir/reddit. 2017-11-14 03:13:19 +00:00			`-st 50 \| --score_threshold 50:`
			`Only mash posts with at least this many points.`
			`Applies to ALL mashes!`

			`--all:`
			`Perform all of the mashes listed below.`

			`--date:`
			`Perform a mash sorted by date.`

			`--title:`
			`Perform a mash sorted by title.`

			`--score:`
			`Perform a mash sorted by score.`

			`--author:`
			`For subreddit databases only.`
			`Perform a mash sorted by author.`

			`--sub:`
			`For username databases only.`
			`Perform a mash sorted by subreddit.`

			`--flair:`
			`Perform a mash sorted by flair.`

			`examples:`
			`timesearch redmash -r botwatch --date`
			`does only the date file.`

			`timesearch redmash -r botwatch --score --title`
			`does both the score and title files.`

			`timesearch redmash -r botwatch --score --score_threshold 50`
			`only shows submissions with >= 50 points.`

			`timesearch redmash -r botwatch --all`
			`performs all of the different mashes.`
			`''',`

			`'timesearch': '''`
			`timesearch:`
			`Collect submissions from the subreddit across all of history, or`
			`Collect submissions by a user (as many as possible).`

			`> timesearch.py timesearch -r subredditname <flags>`
			`> timesearch.py timesearch -u username <flags>`

			`-r "test" \| --subreddit "test":`
			`The subreddit to scan. Mutually exclusive with username.`

			`-u "test" \| --username "test":`
			`The user to scan. Mutually exclusive with subreddit.`

			`-l "update" \| --lower "update":`
			`If a number - the unix timestamp to start at.`
			`If "update" - continue from latest submission in db.`
			`Default: update`

			`-up 1467460221 \| --upper 1467460221:`
			`If a number - the unix timestamp to stop at.`
			`If not provided - stop at current time.`
			`Default: current time`

Integrate with Pushshift.io to restore timesearch. And improve commentaugment. 2018-04-10 02:53:53 +00:00			`--dont_supplement:`
			`If provided, trust the pushshift data and do not fetch live copies`
			`from reddit.`

			`-v \| --verbose:`
			`If provided, print extra information to the screen.`
Initial migratory commit from voussoir/reddit. 2017-11-14 03:13:19 +00:00			`''',`
			`}`


			`def docstring_preview(text):`
			`'''`
			`Return the brief description at the top of the text.`
			`User can get full text by looking at each specifically.`
			`'''`
			`return text.split('\n\n')[0]`

			`def listget(li, index, fallback=None):`
			`try:`
			`return li[index]`
			`except IndexError:`
			`return fallback`

			`def indent(text, spaces=4):`
			`spaces = ' ' * spaces`
			`return '\n'.join(spaces + line if line.strip() != '' else line for line in text.split('\n'))`

			`docstring_headers = {`
			`key: indent(docstring_preview(value))`
			`for (key, value) in MODULE_DOCSTRINGS.items()`
			`}`

			`DOCSTRING = DOCSTRING.format(**docstring_headers)`

			`####################################################################################################`
			`####################################################################################################`

			`def breakdown_gateway(args):`
			`from . import breakdown`
			`breakdown.breakdown_argparse(args)`

			`def commentaugment_gateway(args):`
			`from . import commentaugment`
			`commentaugment.commentaugment_argparse(args)`

			`def getstyles_gateway(args):`
			`from . import getstyles`
			`getstyles.getstyles_argparse(args)`

			`def getwiki_gateway(args):`
			`from . import getwiki`
			`getwiki.getwiki_argparse(args)`

			`def livestream_gateway(args):`
			`from . import livestream`
			`livestream.livestream_argparse(args)`

			`def mergedb_gateway(args):`
			`from . import mergedb`
			`mergedb.mergedb_argparse(args)`

			`def offline_reading_gateway(args):`
			`from . import offline_reading`
			`offline_reading.offline_reading_argparse(args)`

			`def redmash_gateway(args):`
			`from . import redmash`
			`redmash.redmash_argparse(args)`

			`def timesearch_gateway(args):`
			`from . import timesearch`
			`timesearch.timesearch_argparse(args)`


			`parser = argparse.ArgumentParser()`
			`subparsers = parser.add_subparsers()`

			`p_breakdown = subparsers.add_parser('breakdown')`
			`p_breakdown.add_argument('--sort', dest='sort', default=None)`
			`p_breakdown.add_argument('-r', '--subreddit', dest='subreddit', default=None)`
			`p_breakdown.add_argument('-u', '--user', dest='username', default=None)`
			`p_breakdown.set_defaults(func=breakdown_gateway)`

			`p_commentaugment = subparsers.add_parser('commentaugment')`
			`p_commentaugment.add_argument('-r', '--subreddit', dest='subreddit', default=None)`
			`p_commentaugment.add_argument('-s', '--specific', dest='specific_submission', default=None)`
			`p_commentaugment.add_argument('-u', '--user', dest='username', default=None)`
			`p_commentaugment.add_argument('-v', '--verbose', dest='verbose', action='store_true')`
Integrate with Pushshift.io to restore timesearch. And improve commentaugment. 2018-04-10 02:53:53 +00:00			`p_commentaugment.add_argument('--dont_supplement', dest='do_supplement', action='store_false')`
Allow commentaugment to take lower and upper as well. 2018-04-21 06:29:42 +00:00			`p_commentaugment.add_argument('-l', '--lower', dest='lower', default='update')`
			`p_commentaugment.add_argument('-up', '--upper', dest='upper', default=None)`
Initial migratory commit from voussoir/reddit. 2017-11-14 03:13:19 +00:00			`p_commentaugment.set_defaults(func=commentaugment_gateway)`

			`p_getstyles = subparsers.add_parser('getstyles')`
			`p_getstyles.add_argument('-r', '--subreddit', dest='subreddit')`
			`p_getstyles.set_defaults(func=getstyles_gateway)`

			`p_getwiki = subparsers.add_parser('getwiki')`
			`p_getwiki.add_argument('-r', '--subreddit', dest='subreddit')`
			`p_getwiki.set_defaults(func=getwiki_gateway)`

			`p_livestream = subparsers.add_parser('livestream')`
			`p_livestream.add_argument('-1', '--once', dest='once', action='store_true')`
			`p_livestream.add_argument('-c', '--comments', dest='comments', action='store_true')`
			`p_livestream.add_argument('-l', '--limit', dest='limit', default=None)`
			`p_livestream.add_argument('-r', '--subreddit', dest='subreddit', default=None)`
			`p_livestream.add_argument('-s', '--submissions', dest='submissions', action='store_true')`
			`p_livestream.add_argument('-u', '--user', dest='username', default=None)`
			`p_livestream.add_argument('-v', '--verbose', dest='verbose', action='store_true')`
			`p_livestream.add_argument('-w', '--wait', dest='sleepy', default=30)`
			`p_livestream.set_defaults(func=livestream_gateway)`

			`p_mergedb = subparsers.add_parser('mergedb')`
			`p_mergedb.add_argument('--from', dest='from_db_path', required=True)`
			`p_mergedb.add_argument('--to', dest='to_db_path', required=True)`
			`p_mergedb.set_defaults(func=mergedb_gateway)`

			`p_offline_reading = subparsers.add_parser('offline_reading')`
			`p_offline_reading.add_argument('-r', '--subreddit', dest='subreddit', default=None)`
			`p_offline_reading.add_argument('-s', '--specific', dest='specific_submission', default=None)`
			`p_offline_reading.add_argument('-u', '--user', dest='username', default=None)`
			`p_offline_reading.set_defaults(func=offline_reading_gateway)`

			`p_redmash = subparsers.add_parser('redmash')`
			`p_redmash.add_argument('--all', dest='do_all', action='store_true')`
			`p_redmash.add_argument('--author', dest='do_author', action='store_true')`
			`p_redmash.add_argument('--date', dest='do_date', action='store_true')`
			`p_redmash.add_argument('--flair', dest='do_flair', action='store_true')`
			`p_redmash.add_argument('--html', dest='html', action='store_true')`
			`p_redmash.add_argument('--score', dest='do_score', action='store_true')`
			`p_redmash.add_argument('--sub', dest='do_subreddit', action='store_true')`
			`p_redmash.add_argument('--title', dest='do_title', action='store_true')`
Add argument --offline to redmash, points to offline_reading files. Previously, the files generated by offline_reading were difficult to use because there was no index file and the filenames are just ids. So now, the redmash can act as an index! 2020-01-06 04:51:31 +00:00			`p_redmash.add_argument('--offline', dest='offline', action='store_true')`
Initial migratory commit from voussoir/reddit. 2017-11-14 03:13:19 +00:00			`p_redmash.add_argument('-r', '--subreddit', dest='subreddit', default=None)`
			`p_redmash.add_argument('-st', '--score_threshold', dest='score_threshold', default=0)`
			`p_redmash.add_argument('-u', '--user', dest='username', default=None)`
			`p_redmash.set_defaults(func=redmash_gateway)`

			`p_timesearch = subparsers.add_parser('timesearch')`
			`p_timesearch.add_argument('-l', '--lower', dest='lower', default='update')`
			`p_timesearch.add_argument('-r', '--subreddit', dest='subreddit', default=None)`
			`p_timesearch.add_argument('-u', '--user', dest='username', default=None)`
			`p_timesearch.add_argument('-up', '--upper', dest='upper', default=None)`
Integrate with Pushshift.io to restore timesearch. And improve commentaugment. 2018-04-10 02:53:53 +00:00			`p_timesearch.add_argument('-v', '--verbose', dest='verbose', action='store_true')`
			`p_timesearch.add_argument('--dont_supplement', dest='do_supplement', action='store_false')`
Initial migratory commit from voussoir/reddit. 2017-11-14 03:13:19 +00:00			`p_timesearch.set_defaults(func=timesearch_gateway)`

			`def main(argv):`
			`helpstrings = {'', 'help', '-h', '--help'}`

			`command = listget(argv, 0, '').lower()`

			`# The user did not enter a command, or entered something unrecognized.`
			`if command not in MODULE_DOCSTRINGS:`
			`print(DOCSTRING)`
			`if command == '':`
			`print('You are seeing the default help text because you did not choose a command.')`
			`elif command not in helpstrings:`
			`print('You are seeing the default help text because "%s" was not recognized' % command)`
			`return 1`

			`# The user entered a command, but no further arguments, or just help.`
			`argument = listget(argv, 1, '').lower()`
			`if argument in helpstrings:`
			`print(MODULE_DOCSTRINGS[command])`
			`return 1`

			`args = parser.parse_args(argv)`
			`try:`
			`args.func(args)`
Start exception hierarchy; rename DBNotFound to DatabaseNotFound. 2017-12-13 22:07:52 +00:00			`except exceptions.DatabaseNotFound as e:`
			`message = str(e)`
Initial migratory commit from voussoir/reddit. 2017-11-14 03:13:19 +00:00			`message += '\nHave you used any of the other utilities to collect data?'`
			`print(message)`
			`return 1`

			`return 0`

			`if __name__ == '__main__':`
			`raise SystemExit(main(sys.argv[1:]))`