utility.py 1.2 KB
Newer Older
1
"""Contains data helper functions."""
2 3 4 5 6
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import json
7
import codecs
8 9 10


def read_manifest(manifest_path, max_duration=float('inf'), min_duration=0.0):
11
    """Load and parse manifest file.
12

13 14 15
    Instances with durations outside [min_duration, max_duration] will be
    filtered out.

16
    :param manifest_path: Manifest file to load and parse.
17 18 19 20 21 22 23 24 25
    :type manifest_path: basestring
    :param max_duration: Maximal duration in seconds for instance filter.
    :type max_duration: float
    :param min_duration: Minimal duration in seconds for instance filter.
    :type min_duration: float
    :return: Manifest parsing results. List of dict.
    :rtype: list
    :raises IOError: If failed to parse the manifest.
    """
26
    manifest = []
27
    for json_line in codecs.open(manifest_path, 'r', 'utf-8'):
28 29 30 31 32 33 34 35
        try:
            json_data = json.loads(json_line)
        except Exception as e:
            raise IOError("Error reading manifest: %s" % str(e))
        if (json_data["duration"] <= max_duration and
                json_data["duration"] >= min_duration):
            manifest.append(json_data)
    return manifest