else

2016-08-12 17:26:12 -07:00 · 2016-08-12 17:26:12 -07:00 · c491e417f5
commit c491e417f5
parent 53645b0123
5 changed files with 240 additions and 93 deletions
--- a/Javascript/videotiles.js
+++ b/Javascript/videotiles.js
@ -0,0 +1,114 @@
+javascript:
+
+CSS = ""
+ "* {margin: 0; padding: 0}"
+ "html {height: 95%}"
+ "body {height: 100%; background-color: #000}"
+ "div { display:inline-block; }"
+ "video {"
+ "  min-width: 100%;"
+ "  min-height: 100%;"
+ "  max-width: 100%;"
+ "  max-height: 100%;"
+ "  overflow: hidden;"
+ "}"
+;
+
+var VIDEO_TYPES = ["\\.mp4", "\\.m4v", "\\.webm", "\\.ogv"].join("|");
+
+function apply_css()
+{
+    console.log("applying CSS");
+    var css = document.createElement("style");
+    css.innerHTML = CSS;
+    document.head.appendChild(css);
+}
+
+function get_media_links()
+{
+    var anchors = document.getElementsByTagName("a");
+    var media_links = [];
+    for (var index = 0; index < anchors.length; index += 1)
+    {
+        var anchor = anchors[index];
+        if (anchor.href.match(VIDEO_TYPES))
+        {
+            media_links.push(anchor.href);
+        }
+    }
+    return media_links;
+}
+
+function clear_page()
+{
+    /* Remove EVERYTHING */
+    console.log("clearing page");
+    document.removeChild(document.documentElement);
+
+    var html = document.createElement("html");
+    document.appendChild(html);
+
+    var head = document.createElement("head");
+    html.appendChild(head);
+
+    var body = document.createElement("body");
+    html.appendChild(body);
+
+    document.documentElement = html;
+    return true;
+}
+
+function create_video_players(width, height)
+{
+    var css_width = (100 / width).toString() + "%";
+    var css_height = (100 / height).toString() + "%";
+    console.log(css_width);
+
+    var players = [];
+    for (var index = 0; index < width * height; index += 1)
+    {
+        var player_holder = document.createElement("div");
+        var player = document.createElement("video");
+        player_holder.style.width = css_width;
+        player_holder.style.height = css_height;
+        player.holder = player_holder;
+        players.push(player);
+        player_holder.appendChild(player);
+        document.body.appendChild(player_holder);
+    }
+    return players;
+}
+
+function swap_source(player, source_list)
+{
+    var index = Math.floor(Math.random() * source_list.length);
+    var href = source_list[index];
+    player.pause();
+    player.src = href;
+    player.load();
+    player.play();
+}
+
+function main()
+{
+    var WIDTH = 3;
+    var HEIGHT = 3;
+    var MEDIAS = get_media_links();
+
+    clear_page();
+    apply_css();
+
+    var PLAYERS = create_video_players(WIDTH, HEIGHT);
+    function ended_callback()
+    {
+        swap_source(this, MEDIAS);
+    }
+    for (var index = 0; index < PLAYERS.length; index += 1)
+    {
+        var player = PLAYERS[index];
+        player.addEventListener("ended", ended_callback);
+        swap_source(player, MEDIAS);
+    }
+}
+
+main();
--- a/OpenDirDL/README.md
+++ b/OpenDirDL/README.md
@ -7,6 +7,11 @@ Requires `pip install beautifulsoup4`

 See inside opendirdl.py for usage instructions.

+- 2016 08 10
+    - Fixed bug in smart_insert caused by 404's being considered falsey, triggering the 'one and only one' exception.
+    - Fixed bug in smart_insert where 404'd URLs were not being deleted from the database.
+    - Added clickable links to each directory on HTML tree pages.
+
 - 2016 08 02
    - Removed the usage of div IDs on the Tree pages by making the collapse button use `this.nextSibling`.
    - Rewrote `build_file_tree` with a way simpler algorithm.
--- a/OpenDirDL/opendirdl.py
+++ b/OpenDirDL/opendirdl.py
@ -140,10 +140,10 @@ DOWNLOAD_CHUNK = 16 * bytestring.KIBIBYTE

 UNKNOWN_SIZE_STRING = '???'

-# When doing a basic scan, we will not send HEAD requests to URLs that end in these strings,
-# because they're probably files.
-# This isn't meant to be a comprehensive filetype library, but it covers enough of the
-# typical opendir to speed things up.
+# When doing a basic scan, we will not send HEAD requests to URLs that end in
+# these strings, because they're probably files.
+# This isn't meant to be a comprehensive filetype library, but it covers
+# enough of the typical opendir to speed things up.
 SKIPPABLE_FILETYPES = [
 '.aac',
 '.avi',
@ -192,7 +192,8 @@ BLACKLISTED_FILENAMES = [
 ]

 # oh shit
-HTML_TREE_HEADER = '''
+HTML_TREE_HEAD = '''
+<head>
 <meta charset="UTF-8">

 <script type="text/javascript">
@ -215,12 +216,7 @@ function collapse(div)
    font-family: Consolas;
 }

-button
-{
-    display: block;
-}
-
-div
+.directory_even, .directory_odd
 {
    padding: 10px;
    padding-left: 15px;
@ -239,8 +235,18 @@ div
    background-color: #eee;
 }
 </style>
+</head>
 '''

+HTML_FORMAT_DIRECTORY = '''
+<div class="buttonbox">
+<button onclick="collapse(this.parentElement.nextElementSibling)">{name} ({size})</button>
+{directory_anchor}
+</div>
+<div class="{css}" style="display:none">
+'''.replace('\n', '')
+HTML_FORMAT_FILE = '<a href="{url}">{name} ({size})</a><br>'
+
 DB_INIT = '''
 CREATE TABLE IF NOT EXISTS urls(
    url TEXT,
@ -259,7 +265,6 @@ SQL_CONTENT_LENGTH = 2
 SQL_CONTENT_TYPE = 3
 SQL_DO_DOWNLOAD = 4

-
 UNMEASURED_WARNING = '''
 Note: %d files do not have a stored Content-Length.
 Run `measure` with `-f`|`--fullscan` or `-n`|`--new_only` to HEAD request
@ -278,7 +283,7 @@ class Walker:
        self.walkurl = walkurl

        if databasename in (None, ''):
-            domain = url_to_filepath(self.walkurl)['root']
+            domain = url_split(self.walkurl)['root']
            databasename = domain + '.db'
            databasename = databasename.replace(':', '#')
        self.databasename = databasename
@ -439,7 +444,7 @@ class TreeNode:
        self.children = {}

    def __eq__(self, other):
-        return isinstance(other, Treenode) and self.abspath() == other.abspath()
+        return isinstance(other, TreeNode) and self.abspath() == other.abspath()

    def __getitem__(self, key):
        return self.children[key]
@ -470,8 +475,6 @@ class TreeNode:
        return other_node

    def check_child_availability(self, identifier):
-        if ':' in identifier:
-            raise TreeInvalidIdentifier('Only roots may have a colon')
        if identifier in self.children:
            raise TreeExistingChild('Node %s already has child %s' % (self.identifier, identifier))

@ -526,7 +529,7 @@ def build_file_tree(databasename):
        {
            'url': item[SQL_URL],
            'size': item[SQL_CONTENT_LENGTH],
-            'path': path_form.format(**url_to_filepath(item[SQL_URL])).split('\\'),
+            'path_parts': path_form.format(**url_split(item[SQL_URL])).split('\\'),
        }
        for item in all_items
    ]
@ -536,6 +539,7 @@ def build_file_tree(databasename):
        'item_type': 'directory',
        'name': databasename,
    }
+    scheme = url_split(all_items[0]['url'])['scheme']
    tree = TreeNode(databasename, data=root_data)
    tree.unsorted_children = all_items
    node_queue = set()
@ -546,12 +550,12 @@ def build_file_tree(databasename):
    # directories. Those nodes receive all subdirectories, and repeat.
    while len(node_queue) > 0:
        node = node_queue.pop()
-        for to_sort in node.unsorted_children:
-            path = to_sort['path']
-            # Create a new node for the directory, path[0]
-            # path[1:] is assigned to that node to be divided next.
-            child_identifier = path.pop(0)
-            child_identifier = child_identifier.replace(':', '#')
+        for new_child_data in node.unsorted_children:
+            path_parts = new_child_data['path_parts']
+            # Create a new node for the directory, path_parts[0]
+            # path_parts[1:] is assigned to that node to be divided next.
+            child_identifier = path_parts.pop(0)
+            #child_identifier = child_identifier.replace(':', '#')

            child = node.children.get(child_identifier, None)
            if not child:
@ -559,15 +563,21 @@ def build_file_tree(databasename):
                child.unsorted_children = []
                node.add_child(child)

-            child.data['url'] = to_sort['url']
            child.data['name'] = child_identifier
-            if len(path) > 0:
+            if len(path_parts) > 0:
                child.data['item_type'] = 'directory'
-                child.unsorted_children.append(to_sort)
+                child.unsorted_children.append(new_child_data)
                node_queue.add(child)
            else:
                child.data['item_type'] = 'file'
-                child.data['size'] = to_sort['size']
+                child.data['size'] = new_child_data['size']
+                child.data['url'] = new_child_data['url']
+        if node.parent is None:
+            continue
+        elif node.parent == tree:
+            node.data['url'] = scheme + '://' + node.identifier
+        else:
+            node.data['url'] = node.parent.data['url'] + '/' + node.identifier

        del node.unsorted_children

@ -670,12 +680,21 @@ def recursive_print_node(node, depth=0, use_html=False, output_file=None):
    if use_html:
        css_class = 'directory_even' if depth % 2 == 0 else 'directory_odd'
        if node.data['item_type'] == 'directory':
-            line = '<button onclick="collapse(this.nextSibling)">{name} ({size})</button>'
-            line += '<div class="{css}" style="display:none">'
-            line = line.format(name=node.data['name'], size=size, css=css_class)
+            directory_url = node.data.get('url')
+            directory_anchor = '<a href="{url}">►</a>' if directory_url else ''
+            directory_anchor = directory_anchor.format(url=directory_url)
+            line = HTML_FORMAT_DIRECTORY.format(
+                css=css_class,
+                directory_anchor=directory_anchor,
+                name=node.data['name'],
+                size=size,
+            )
        else:
-            line = '<a href="{url}">{name} ({size})</a><br>'
-            line = line.format(url=node.data['url'], name=node.data['name'], size=size)
+            line = HTML_FORMAT_FILE.format(
+                name=node.data['name'],
+                size=size,
+                url=node.data['url'],
+            )
    else:
        line = '{space}{bar}{name} : ({size})'
        line = line.format(
@ -697,6 +716,7 @@ def recursive_print_node(node, depth=0, use_html=False, output_file=None):

    if node.data['item_type'] == 'directory':
        if use_html:
+            # Close the directory div
            write('</div>', output_file)
        else:
            # This helps put some space between sibling directories
@ -713,7 +733,7 @@ def smart_insert(sql, cur, url=None, head=None, commit=True):
    INSERT or UPDATE the appropriate entry, or DELETE if the head
    shows a 403 / 404.
    '''
-    if bool(url) is bool(head):
+    if bool(url) is bool(head) and not isinstance(head, requests.Response):
        raise ValueError('One and only one of `url` or `head` is necessary.')

    if url is not None:
@ -722,6 +742,7 @@ def smart_insert(sql, cur, url=None, head=None, commit=True):
        content_type = None

    elif head is not None:
+        url = head.url
        # When doing a full scan, we get a Response object.
        if head.status_code in [403, 404]:
            cur.execute('DELETE FROM urls WHERE url == ?', [url])
@ -735,7 +756,7 @@ def smart_insert(sql, cur, url=None, head=None, commit=True):
                content_length = int(content_length)
            content_type = head.headers.get('Content-Type', None)

-    basename = url_to_filepath(url)['filename']
+    basename = url_split(url)['filename']
    basename = urllib.parse.unquote(basename)
    do_download = True

@ -759,7 +780,7 @@ def smart_insert(sql, cur, url=None, head=None, commit=True):
        sql.commit()
    return data

-def url_to_filepath(text):
+def url_split(text):
    text = urllib.parse.unquote(text)
    parts = urllib.parse.urlsplit(text)
    if any(part == '' for part in [parts.scheme, parts.netloc]):
@ -852,7 +873,7 @@ def download(
        # on their own.
        cur.execute('SELECT url FROM urls LIMIT 1')
        url = cur.fetchone()[0]
-        outputdir = url_to_filepath(url)['root']
+        outputdir = url_split(url)['root']

    if isinstance(bytespersecond, str):
        bytespersecond = bytestring.parsebytes(bytespersecond)
@ -861,7 +882,7 @@ def download(
    for fetch in fetch_generator(cur):
        url = fetch[SQL_URL]

-        url_filepath = url_to_filepath(url)
+        url_filepath = url_split(url)
        folder = os.path.join(outputdir, url_filepath['folder'])
        os.makedirs(folder, exist_ok=True)

@ -1012,7 +1033,7 @@ def measure(databasename, fullscan=False, new_only=False):

    items = cur.fetchall()

-    filecount = 0
+    filecount = len(items)
    unmeasured_file_count = 0

    for fetch in items:
@ -1023,21 +1044,27 @@ def measure(databasename, fullscan=False, new_only=False):
            head = do_head(url, raise_for_status=False)
            fetch = smart_insert(sql, cur, head=head, commit=True)
            size = fetch[SQL_CONTENT_LENGTH]
-            if size is None:
-                write('"%s" is not revealing Content-Length' % url)
-                size = 0

-
-        elif fetch[SQL_CONTENT_LENGTH] is None:
+        elif size is None:
+            # Unmeasured and no intention to measure.
            unmeasured_file_count += 1
            size = 0

+        if size is None:
+            # Unmeasured even though we tried the head request.
+            write('"%s" is not revealing Content-Length' % url)
+            size = 0
+
        totalsize += size
-        filecount += 1

    sql.commit()
-    short_string = bytestring.bytestring(totalsize)
-    totalsize_string = '{} ({:,} bytes) in {:,} files'.format(short_string, totalsize, filecount)
+    size_string = bytestring.bytestring(totalsize)
+    totalsize_string = '{size_short} ({size_exact:,} bytes) in {filecount:,} files'
+    totalsize_string = totalsize_string.format(
+        size_short=size_string,
+        size_exact=totalsize,
+        filecount=filecount,
+    )
    write(totalsize_string)
    if unmeasured_file_count > 0:
        write(UNMEASURED_WARNING % unmeasured_file_count)
@ -1078,7 +1105,9 @@ def tree(databasename, output_filename=None):
        use_html = False

    if use_html:
-        write(HTML_TREE_HEADER, output_file)
+        write('<!DOCTYPE html>\n<html>', output_file)
+        write(HTML_TREE_HEAD, output_file)
+        write('<body>', output_file)

    size_details = recursive_get_size(tree)
    recursive_print_node(tree, use_html=use_html, output_file=output_file)
@ -1086,6 +1115,8 @@ def tree(databasename, output_filename=None):
        write(UNMEASURED_WARNING % size_details['unmeasured'], output_file)

    if output_file is not None:
+        if use_html:
+            write('</body>\n</html>', output_file)
        output_file.close()
    return tree

--- a/Pathclass/pathclass.py
+++ b/Pathclass/pathclass.py
@ -13,6 +13,9 @@ class Path:
    def __contains__(self, other):
        return other.absolute_path.startswith(self.absolute_path)

+    def __eq__(self, other):
+        return hasattr(other, 'absolute_path') and self.absolute_path == other.absolute_path
+
    def __hash__(self):
        return hash(self.absolute_path)

@ -75,31 +78,31 @@ def get_path_casing(path):
    (drive, subpath) = os.path.splitdrive(path)
    subpath = subpath.lstrip(os.sep)

-    def patternize(piece):
-        '''
-        Create a pattern like "[u]ser" from "user", forcing glob to look up the
-        correct path name, and guaranteeing that the only result will be the correct path.
-
-        Special cases are:
-            !, because in glob syntax, [!x] tells glob to look for paths that don't contain
-                "x". [!] is invalid syntax, so we pick the first non-! character to put
-                in the brackets.
-            [, because this starts a capture group
-        '''
-        piece = glob.escape(piece)
-        for character in piece:
-            if character not in '![]':
-                replacement = '[%s]' % character
-                #print(piece, character, replacement)
-                piece = piece.replace(character, replacement, 1)
-                break
-        return piece
-
-    pattern = [patternize(piece) for piece in subpath.split(os.sep)]
+    pattern = [glob_patternize(piece) for piece in subpath.split(os.sep)]
    pattern = os.sep.join(pattern)
    pattern = drive.upper() + os.sep + pattern
    #print(pattern)
    try:
        return glob.glob(pattern)[0]
    except IndexError:
-        return path
+        return path
+
+def glob_patternize(piece):
+    '''
+    Create a pattern like "[u]ser" from "user", forcing glob to look up the
+    correct path name, while guaranteeing that the only result will be the correct path.
+
+    Special cases are:
+        !, because in glob syntax, [!x] tells glob to look for paths that don't contain
+            "x". [!] is invalid syntax, so we pick the first non-! character to put
+            in the brackets.
+        [, because this starts a capture group
+    '''
+    piece = glob.escape(piece)
+    for character in piece:
+        if character not in '![]':
+            replacement = '[%s]' % character
+            #print(piece, character, replacement)
+            piece = piece.replace(character, replacement, 1)
+            break
+    return piece
--- a/SpinalTap/spinal.py
+++ b/SpinalTap/spinal.py
@ -52,7 +52,7 @@ def callback_v1(fpobj, written_bytes, total_bytes):
        ends = '\n'
    else:
        ends = ''
-    percent = (100 * written_bytes) / total_bytes
+    percent = (100 * written_bytes) / max(total_bytes, 1)
    percent = '%07.3f' % percent
    written = '{:,}'.format(written_bytes)
    total = '{:,}'.format(total_bytes)
@ -196,17 +196,13 @@ def copy_dir(
        m += '`destination_new_root` can be passed.'
        raise ValueError(m)

-    source = pathclass.get_path_casing(source)
    source = str_to_fp(source)

    if destination_new_root is not None:
        destination = new_root(source, destination_new_root)
    destination = str_to_fp(destination)

-    callback_directory = callback_directory or do_nothing
-    callback_verbose = callback_verbose or do_nothing
-
-    if is_subfolder(source, destination):
+    if destination in source:
        raise RecursiveDirectory(source, destination)

    if not source.is_dir:
@ -220,6 +216,8 @@ def copy_dir(
    else:
        total_bytes = 0

+    callback_directory = callback_directory or do_nothing
+    callback_verbose = callback_verbose or do_nothing
    bytes_per_second = limiter_or_none(bytes_per_second)
    files_per_second = limiter_or_none(files_per_second)

@ -350,7 +348,6 @@ def copy_file(
        m += '`destination_new_root` can be passed'
        raise ValueError(m)

-    source = pathclass.get_path_casing(source)
    source = str_to_fp(source)

    if destination_new_root is not None:
@ -370,13 +367,11 @@ def copy_file(

    # Determine overwrite
    if destination.exists:
-        destination_modtime = destination.stat.st_mtime
-
        if overwrite_old is False:
            return [destination, 0]

        source_modtime = source.stat.st_mtime
-        if source_modtime == destination_modtime:
+        if source_modtime == destination.stat.st_mtime:
            return [destination, 0]

    # Copy
@ -460,6 +455,8 @@ def is_xor(*args):
    return [bool(a) for a in args].count(True) == 1

 def limiter_or_none(value):
+    if isinstance(value, str):
+        value = bytestring.parsebytes(value)
    if isinstance(value, ratelimiter.Ratelimiter):
        limiter = value
    elif value is not None:
@ -506,7 +503,7 @@ def walk_generator(
        exclude_filenames=None,
    ):
    '''
-    Yield Path objects from the file tree similar to os.walk.
+    Yield Path objects for files in the file tree, similar to os.walk.

    callback_exclusion:
        This function will be called when a file or directory is excluded with
@ -563,31 +560,28 @@ def walk_generator(
    # This is a recursion-free workplace.
    # Thank you for your cooperation.
    while len(directory_queue) > 0:
-        location = directory_queue.popleft()
-        callback_verbose('listdir: %s' % location)
-        contents = os.listdir(location)
+        current_location = directory_queue.popleft()
+        callback_verbose('listdir: %s' % current_location)
+        contents = os.listdir(current_location)
        callback_verbose('received %d items' % len(contents))

        directories = []
        for base_name in contents:
-            absolute_name = os.path.join(location, base_name)
+            absolute_name = os.path.join(current_location, base_name)

            if os.path.isdir(absolute_name):
-                if normalize(absolute_name) in exclude_directories:
-                    callback_exclusion(absolute_name, 'directory')
-                    continue
-
-                if normalize(base_name) in exclude_directories:
+                exclude = normalize(absolute_name) in exclude_directories
+                exclude |= normalize(base_name) in exclude_directories
+                if exclude:
                    callback_exclusion(absolute_name, 'directory')
                    continue

                directories.append(absolute_name)

            else:
-                if normalize(base_name) in exclude_filenames:
-                    callback_exclusion(absolute_name, 'file')
-                    continue
-                if normalize(absolute_name) in exclude_filenames:
+                exclude = normalize(absolute_name) in exclude_filenames
+                exclude |= normalize(base_name) in exclude_filenames
+                if exclude:
                    callback_exclusion(absolute_name, 'file')
                    continue