Merge branch 'develop'

2026-07-09 02:24:01 +01:00 · 2017-04-06 10:11:01 +12:00
parent debc65db5d 437d33e7a8
commit e1e361a46e
124 changed files with 17497 additions and 6588 deletions
@@ -11,7 +11,6 @@ cache:
    - lib

 python:
-  - "2.6"
  - "2.7"

 install:
@@ -1,4 +1,4 @@
-##![Headphones Logo](https://github.com/rembo10/headphones/raw/master/data/images/headphoneslogo.png) Headphones
+## ![Headphones Logo](https://github.com/rembo10/headphones/raw/master/data/images/headphoneslogo.png) Headphones

 [![Build Status](https://travis-ci.org/rembo10/headphones.svg?branch=master)](https://travis-ci.org/rembo10/headphones)
 [![Build Status](https://img.shields.io/travis/rembo10/headphones/develop.svg?label=develop%20branch%20build)](https://travis-ci.org/rembo10/headphones)
@@ -678,24 +678,20 @@

                                <fieldset>
                                    <div class="row checkbox left">
-                                        <input id="use_pth" type="checkbox" class="bigcheck" name="use_pth" value="1" ${config['use_pth']} /><label for="use_pth"><span class="option">PassTheHeadphones.me</span></label>
+                                        <input id="use_redacted" type="checkbox" class="bigcheck" name="use_redacted" value="1" ${config['use_redacted']} /><label for="use_redacted"><span class="option">Redacted</span></label>
                                    </div>
                                    <div class="config">
                                        <div class="row">
                                            <label>Username</label>
-                                            <input type="text" name="pth_username" value="${config['pth_username']}" size="36">
+                                            <input type="text" name="redacted_username" value="${config['redacted_username']}" size="36">
                                        </div>
                                        <div class="row">
                                            <label>Password</label>
-                                            <input type="password" name="pth_password" value="${config['pth_password'] | h}" size="36">
-                                        </div>
-                                        <div class="row">
-                                            <label>URL</label>
-                                            <input type="text" name="pth_url" value="${config['pth_url']}" size="36">
+                                            <input type="password" name="redacted_password" value="${config['redacted_password'] | h}" size="36">
                                        </div>
                                        <div class="row">
                                            <label>Seed Ratio</label>
-                                            <input type="text" class="override-float" name="pth_ratio" value="${config['pth_ratio']}" size="10" title="Stop seeding when ratio met, 0 = unlimited. Scheduled job will remove torrent when post processed and finished seeding">
+                                            <input type="text" class="override-float" name="redacted_ratio" value="${config['redacted_ratio']}" size="10" title="Stop seeding when ratio met, 0 = unlimited. Scheduled job will remove torrent when post processed and finished seeding">
                                        </div>
                                    </div>
                                </fieldset>
@@ -949,30 +945,42 @@
                                        <input type="checkbox" name="keep_nfo" value="1" ${config['keep_nfo']} />
                                    </label>
                                </div>
+                                <div class="row checkbox left clearfix nopad">
+                                    <label>
+                                        Embed lyrics
+                                        <input type="checkbox" name="embed_lyrics" value="1" ${config['embed_lyrics']}>
+                                    </label>
+                                </div>
+
+
+                                <div class="row checkbox left clearfix nopad">
+                                    <label>
+                                        Embed album art in each file
+                                        <input type="checkbox" name="embed_album_art" id="embed_album_art" value="1" ${config['embed_album_art']}>
+                                    </label>
+                                </div>
+
                                <div class="row checkbox left clearfix nopad">
                                    <label>
                                        Add album art jpeg to album folder
                                        <input type="checkbox" name="add_album_art" id="add_album_art" value="1" ${config['add_album_art']}>
                                    </label>
                                </div>
+
                                <div id="album_art_options" style="padding-left: 20px">
                                    <div class="row">
                                        as <input type="text" class="override-float" name="album_art_format" value="${config['album_art_format']}" size="10">.jpg
                                    </div>
                                    <small>Use $Artist/$artist, $Album/$album, $Year/$year, put optional variables in curly braces, use single-quote marks to escape curly braces literally ('{', '}').</small>
                                </div>
-                                <div class="row checkbox left clearfix nopad">
-                                    <label>
-                                        Embed album art in each file
-                                        <input type="checkbox" name="embed_album_art" value="1" ${config['embed_album_art']}>
-                                    </label>
-                                </div>
-                                <div class="row checkbox left clearfix nopad">
-                                    <label>
-                                        Embed lyrics
-                                        <input type="checkbox" name="embed_lyrics" value="1" ${config['embed_lyrics']}>
-                                    </label>
+
+                                <div id="album_art_size_options" style="padding-left: 20px">
+                                    <div class="row">
+                                        Album art min width <input type="text" class="override-float" name="album_art_min_width" value="${config['album_art_min_width']}" size="4" title="Only images with a pixel width greater or equal are considered as valid album art candidates. Default: 0.">\
+                                        Album art max width <input type="text" class="override-float" name="album_art_max_width" value="${config['album_art_max_width']}" size="4" title="A maximum image width to downscale fetched images if they are too big.">
+                                    </div>
                                </div>
+
                                <div class="row">
                                    <label>
                                        Destination Directory:
@@ -1903,9 +1911,36 @@
                        }
                });

+                if ($("#embed_album_art").is(":checked"))
+                        {
+                            $("#album_art_size_options").show();
+                        }
+                        else
+                        {
+                            if (!$("#add_album_art").is(":checked"))
+                            {
+                                $("#album_art_size_options").hide();
+                              }
+                        }
+
+                $("#embed_album_art").click(function(){
+                        if ($("#embed_album_art").is(":checked"))
+                        {
+                            $("#album_art_size_options").slideDown();
+                        }
+                        else
+                        {
+                            if (!$("#add_album_art").is(":checked"))
+                            {
+                                $("#album_art_size_options").slideUp();
+                            }
+                        }
+                });
+
                if ($("#add_album_art").is(":checked"))
                        {
                            $("#album_art_options").show();
+                            $("#album_art_size_options").show();
                        }
                else
                        {
@@ -1916,10 +1951,15 @@
                        if ($("#add_album_art").is(":checked"))
                        {
                            $("#album_art_options").slideDown();
+                            $("#album_art_size_options").slideDown();
                        }
                        else
                        {
                            $("#album_art_options").slideUp();
+                            if (!$("#embed_album_art").is(":checked"))
+                            {
+                                $("#album_art_size_options").slideUp();
+                            }
                        }
                });

@@ -2361,7 +2401,7 @@
                        }
                if ($("#torrent_downloader_deluge").is(":checked"))
                        {
-                            $("#torrent_blackhole_options,#transmission_options,#utorrent_options,#qbittorent_options").hide();
+                            $("#torrent_blackhole_options,#transmission_options,#utorrent_options,#qbittorrent_options").hide();
                            $("#deluge_options").show();
                        }

@@ -2514,7 +2554,7 @@
                initConfigCheckbox("#use_waffles");
                initConfigCheckbox("#use_rutracker");
                initConfigCheckbox("#use_apollo");
-                initConfigCheckbox("#use_pth");
+                initConfigCheckbox("#use_redacted");
                initConfigCheckbox("#use_strike");
                initConfigCheckbox("#api_enabled");
                initConfigCheckbox("#enable_https");
@@ -306,9 +306,10 @@ def initialize_scheduler():
                         minutes=minutes)

        # Remove Torrent + data if Post Processed and finished Seeding
-        minutes = CONFIG.TORRENT_REMOVAL_INTERVAL
-        schedule_job(torrentfinished.checkTorrentFinished, 'Torrent removal check', hours=0,
-                     minutes=minutes)
+        if headphones.CONFIG.TORRENT_DOWNLOADER != 0:
+            minutes = CONFIG.TORRENT_REMOVAL_INTERVAL
+            schedule_job(torrentfinished.checkTorrentFinished, 'Torrent removal check', hours=0,
+                         minutes=minutes)

        # Start scheduler
        if start_jobs and len(SCHED.get_jobs()):
@@ -376,7 +377,7 @@ def dbcheck():
    c.execute(
        'CREATE TABLE IF NOT EXISTS alltracks (ArtistID TEXT, ArtistName TEXT, AlbumTitle TEXT, AlbumASIN TEXT, AlbumID TEXT, TrackTitle TEXT, TrackDuration, TrackID TEXT, TrackNumber INTEGER, Location TEXT, BitRate INTEGER, CleanName TEXT, Format TEXT, ReleaseID TEXT)')
    c.execute(
-        'CREATE TABLE IF NOT EXISTS snatched (AlbumID TEXT, Title TEXT, Size INTEGER, URL TEXT, DateAdded TEXT, Status TEXT, FolderName TEXT, Kind TEXT)')
+        'CREATE TABLE IF NOT EXISTS snatched (AlbumID TEXT, Title TEXT, Size INTEGER, URL TEXT, DateAdded TEXT, Status TEXT, FolderName TEXT, Kind TEXT, TorrentHash TEXT)')
    # Matched is a temporary value used to see if there was a match found in
    # alltracks
    c.execute(
@@ -613,6 +614,12 @@ def dbcheck():
    except sqlite3.OperationalError:
        c.execute('ALTER TABLE artists ADD COLUMN MetaCritic TEXT DEFAULT NULL')

+    try:
+        c.execute('SELECT TorrentHash from snatched')
+    except sqlite3.OperationalError:
+        c.execute('ALTER TABLE snatched ADD COLUMN TorrentHash TEXT')
+        c.execute('UPDATE snatched SET TorrentHash = FolderName WHERE Status LIKE "Seed_%"')
+
    conn.commit()
    c.close()

@@ -13,16 +13,164 @@
 #  You should have received a copy of the GNU General Public License
 #  along with Headphones.  If not, see <http://www.gnu.org/licenses/>.

-from headphones import request, db, logger
+import struct
+from six.moves.urllib.parse import urlencode
+from io import BytesIO
+
+import headphones
+from headphones import db, request, logger


 def getAlbumArt(albumid):
-    myDB = db.DBConnection()
-    asin = myDB.action(
-        'SELECT AlbumASIN from albums WHERE AlbumID=?', [albumid]).fetchone()[0]

-    if asin:
-        return 'http://ec1.images-amazon.com/images/P/%s.01.LZZZZZZZ.jpg' % asin
+    artwork_path = None
+    artwork = None
+
+    # CAA
+    logger.info("Searching for artwork at CAA")
+    artwork_path = 'http://coverartarchive.org/release-group/%s/front' % albumid
+    artwork = getartwork(artwork_path)
+    if artwork:
+        logger.info("Artwork found at CAA")
+        return artwork_path, artwork
+
+    # Amazon
+    logger.info("Searching for artwork at Amazon")
+    myDB = db.DBConnection()
+    dbalbum = myDB.action(
+        'SELECT ArtistName, AlbumTitle, ReleaseID, AlbumASIN FROM albums WHERE AlbumID=?',
+        [albumid]).fetchone()
+    if dbalbum['AlbumASIN']:
+        artwork_path = 'http://ec1.images-amazon.com/images/P/%s.01.LZZZZZZZ.jpg' % dbalbum['AlbumASIN']
+        artwork = getartwork(artwork_path)
+        if artwork:
+            logger.info("Artwork found at Amazon")
+            return artwork_path, artwork
+
+    # last.fm
+    from headphones import lastfm
+    logger.info("Searching for artwork at last.fm")
+    if dbalbum['ReleaseID'] != albumid:
+        data = lastfm.request_lastfm("album.getinfo", mbid=dbalbum['ReleaseID'])
+        if not data:
+            data = lastfm.request_lastfm("album.getinfo", artist=dbalbum['ArtistName'],
+                                         album=dbalbum['AlbumTitle'])
+    else:
+        data = lastfm.request_lastfm("album.getinfo", artist=dbalbum['ArtistName'],
+                                     album=dbalbum['AlbumTitle'])
+
+    if data:
+        try:
+            images = data['album']['image']
+            for image in images:
+                if image['size'] == 'extralarge':
+                    artwork_path = image['#text']
+                elif image['size'] == 'mega':
+                    artwork_path = image['#text']
+                    break
+        except KeyError:
+            artwork_path = None
+
+        if artwork_path:
+            artwork = getartwork(artwork_path)
+            if artwork:
+                logger.info("Artwork found at last.fm")
+                return artwork_path, artwork
+
+    logger.info("No suitable album art found.")
+    return None, None
+
+
+def jpeg(bites):
+    fhandle = BytesIO(bites)
+    try:
+        fhandle.seek(0)
+        size = 2
+        ftype = 0
+        while not 0xc0 <= ftype <= 0xcf:
+            fhandle.seek(size, 1)
+            byte = fhandle.read(1)
+            while ord(byte) == 0xff:
+                byte = fhandle.read(1)
+            ftype = ord(byte)
+            size = struct.unpack('>H', fhandle.read(2))[0] - 2
+        fhandle.seek(1, 1)
+        height, width = struct.unpack('>HH', fhandle.read(4))
+        return width, height
+    except struct.error:
+        return None, None
+    except TypeError:
+        return None, None
+
+
+def png(bites):
+    try:
+        check = struct.unpack('>i', bites[4:8])[0]
+        if check != 0x0d0a1a0a:
+            return None, None
+        return struct.unpack('>ii', bites[16:24])
+    except struct.error:
+        return None, None
+
+
+def get_image_data(bites):
+    type = None
+    width = None
+    height = None
+    if len(bites) < 24:
+        return None, None, None
+
+    peek = bites[0:2]
+    if peek == b'\xff\xd8':
+        width, height = jpeg(bites)
+        type = 'jpg'
+    elif peek == b'\x89P':
+        width, height = png(bites)
+        type = 'png'
+    return type, width, height
+
+
+def getartwork(artwork_path):
+    artwork = bytes()
+    minwidth = 0
+    maxwidth = 0
+    if headphones.CONFIG.ALBUM_ART_MIN_WIDTH:
+        minwidth = int(headphones.CONFIG.ALBUM_ART_MIN_WIDTH)
+    if headphones.CONFIG.ALBUM_ART_MAX_WIDTH:
+        maxwidth = int(headphones.CONFIG.ALBUM_ART_MAX_WIDTH)
+
+    resp = request.request_response(artwork_path, timeout=20, stream=True, whitelist_status_code=404)
+
+    if resp:
+        img_width = None
+        for chunk in resp.iter_content(chunk_size=1024):
+            artwork += chunk
+            if not img_width and (minwidth or maxwidth):
+                img_type, img_width, img_height = get_image_data(artwork)
+            # Check min/max
+            if img_width and (minwidth or maxwidth):
+                if minwidth and img_width < minwidth:
+                    logger.info("Artwork is too small. Type: %s. Width: %s. Height: %s",
+                                img_type, img_width, img_height)
+                    artwork = None
+                    break
+                elif maxwidth and img_width > maxwidth:
+                    # Downsize using proxy service to max width
+                    artwork_path = '{0}?{1}'.format('http://images.weserv.nl/', urlencode({
+                        'url': artwork_path.replace('http://', ''),
+                        'w': maxwidth,
+                    }))
+                    artwork = bytes()
+                    r = request.request_response(artwork_path, timeout=20, stream=True, whitelist_status_code=404)
+                    if r:
+                        for chunk in r.iter_content(chunk_size=1024):
+                            artwork += chunk
+                        r.close()
+                        logger.info("Artwork is greater than the maximum width, downsized using proxy service")
+                    break
+        resp.close()
+
+    return artwork


 def getCachedArt(albumid):
@@ -34,6 +34,8 @@ _CONFIG_DEFINITIONS = {
    'ADD_ALBUM_ART': (int, 'General', 0),
    'ADVANCEDENCODER': (str, 'General', ''),
    'ALBUM_ART_FORMAT': (str, 'General', 'folder'),
+    'ALBUM_ART_MIN_WIDTH': (str, 'General', ''),
+    'ALBUM_ART_MAX_WIDTH': (str, 'General', ''),
    # This is used in importer.py to determine how complete an album needs to
    # be - to be considered "downloaded". Percentage from 0-100
    'ALBUM_COMPLETION_PCT': (int, 'Advanced', 80),
@@ -304,11 +306,10 @@ _CONFIG_DEFINITIONS = {
    'WAFFLES_PASSKEY': (str, 'Waffles', ''),
    'WAFFLES_RATIO': (str, 'Waffles', ''),
    'WAFFLES_UID': (str, 'Waffles', ''),
-    'PTH': (int, 'PassTheHeadphones.me', 0),
-    'PTH_PASSWORD': (str, 'PassTheHeadphones.me', ''),
-    'PTH_RATIO': (str, 'PassTheHeadphones.me', ''),
-    'PTH_USERNAME': (str, 'PassTheHeadphones.me', ''),
-    'PTH_URL': (str, 'PassTheHeadphones.me', 'https://passtheheadphones.me'),
+    'REDACTED': (int, 'Redacted', 0),
+    'REDACTED_USERNAME': (str, 'Redacted', ''),
+    'REDACTED_PASSWORD': (str, 'Redacted', ''),
+    'REDACTED_RATIO': (str, 'Redacted', ''),
    'XBMC_ENABLED': (int, 'XBMC', 0),
    'XBMC_HOST': (str, 'XBMC', ''),
    'XBMC_NOTIFY': (int, 'XBMC', 0),
@@ -49,6 +49,7 @@ delugeweb_auth = {}
 delugeweb_url = ''
 deluge_verify_cert = False
 scrub_logs = True
+headers = {'Accept': 'application/json', 'Content-Type': 'application/json'}


 def _scrubber(text):
@@ -104,11 +105,11 @@ def addTorrent(link, data=None, name=None):
                # return addTorrent(local_torrent_path)
            else:
                user_agent = 'Mozilla/5.0 (Windows NT 6.3; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2243.2 Safari/537.36'
-            headers = {'User-Agent': user_agent}
+            get_headers = {'User-Agent': user_agent}
            torrentfile = ''
            logger.debug('Deluge: Trying to download (GET)')
            try:
-                r = requests.get(link, headers=headers)
+                r = requests.get(link, headers=get_headers)
                if r.status_code == 200:
                    logger.debug('Deluge: 200 OK')
                    # .text will ruin the encoding for some torrents
@@ -202,7 +203,7 @@ def getTorrentFolder(result):
                                ],
                                "id": 21})
        response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-            verify=deluge_verify_cert)
+            verify=deluge_verify_cert, headers=headers)
        result['total_done'] = json.loads(response.text)['result']['total_done']

        tries = 0
@@ -210,7 +211,7 @@ def getTorrentFolder(result):
            tries += 1
            time.sleep(5)
            response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-                verify=deluge_verify_cert)
+                verify=deluge_verify_cert, headers=headers)
            result['total_done'] = json.loads(response.text)['result']['total_done']

        post_data = json.dumps({"method": "web.get_torrent_status",
@@ -229,7 +230,7 @@ def getTorrentFolder(result):
                                "id": 23})

        response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-            verify=deluge_verify_cert)
+            verify=deluge_verify_cert, headers=headers)

        result['save_path'] = json.loads(response.text)['result']['save_path']
        result['name'] = json.loads(response.text)['result']['name']
@@ -245,18 +246,45 @@ def removeTorrent(torrentid, remove_data=False):
        _get_auth()

    try:
-        result = False
-        post_data = json.dumps({"method": "core.remove_torrent",
+        logger.debug('Deluge: Checking if torrent %s finished seeding' % str(torrentid))
+        post_data = json.dumps({"method": "web.get_torrent_status",
                                "params": [
                                    torrentid,
-                                    remove_data
-                                    ],
-                                "id": 25})
-        response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-            verify=deluge_verify_cert)
-        result = json.loads(response.text)['result']
+                                    [
+                                        "name",
+                                        "ratio",
+                                        "state"
+                                    ]
+                                ],
+                                "id": 26})

-        return result
+        response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
+            verify=deluge_verify_cert, headers=headers)
+
+        try:
+            state = json.loads(response.text)['result']['state']
+        except KeyError as e:
+            logger.debug('Deluge: "state" KeyError when trying to remove torrent %s' % str(torrentid))
+            return False
+
+        not_finished = ["queued", "seeding", "downloading", "checking", "error"]
+        result = False
+        if state.lower() in not_finished:
+            logger.debug('Deluge: Torrent %s is either queued or seeding, not removing yet' % str(torrentid))
+            return False
+        else:
+            logger.debug('Deluge: Removing torrent %s' % str(torrentid))
+            post_data = json.dumps({"method": "core.remove_torrent",
+                                    "params": [
+                                        torrentid,
+                                        remove_data
+                                        ],
+                                    "id": 25})
+            response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
+                verify=deluge_verify_cert, headers=headers)
+            result = json.loads(response.text)['result']
+
+            return result
    except Exception as e:
        logger.error('Deluge: Removing torrent failed: %s' % str(e))
        formatted_lines = traceback.format_exc().splitlines()
@@ -296,12 +324,12 @@ def _get_auth():
                            "id": 1})
    try:
        response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-            verify=deluge_verify_cert)
+            verify=deluge_verify_cert, headers=headers)
    except requests.ConnectionError:
        try:
            logger.debug('Deluge: Connection failed, let\'s try HTTPS just in case')
            response = requests.post(delugeweb_url.replace('http:', 'https:'), data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-                verify=deluge_verify_cert)
+                verify=deluge_verify_cert, headers=headers)
            # If the previous line didn't fail, change delugeweb_url for the rest of this session
            logger.error('Deluge: Switching to HTTPS, but certificate won\'t be verified because NO CERTIFICATE WAS CONFIGURED!')
            delugeweb_url = delugeweb_url.replace('http:', 'https:')
@@ -326,7 +354,7 @@ def _get_auth():
                            "id": 10})
    try:
        response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-            verify=deluge_verify_cert)
+            verify=deluge_verify_cert, headers=headers)
    except Exception as e:
        logger.error('Deluge: Authentication failed: %s' % str(e))
        formatted_lines = traceback.format_exc().splitlines()
@@ -343,7 +371,7 @@ def _get_auth():
                                "id": 11})
        try:
            response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-                verify=deluge_verify_cert)
+                verify=deluge_verify_cert, headers=headers)
        except Exception as e:
            logger.error('Deluge: Authentication failed: %s' % str(e))
            formatted_lines = traceback.format_exc().splitlines()
@@ -361,7 +389,7 @@ def _get_auth():

        try:
            response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-                verify=deluge_verify_cert)
+                verify=deluge_verify_cert, headers=headers)
        except Exception as e:
            logger.error('Deluge: Authentication failed: %s' % str(e))
            formatted_lines = traceback.format_exc().splitlines()
@@ -374,7 +402,7 @@ def _get_auth():

        try:
            response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-                verify=deluge_verify_cert)
+                verify=deluge_verify_cert, headers=headers)
        except Exception as e:
            logger.error('Deluge: Authentication failed: %s' % str(e))
            formatted_lines = traceback.format_exc().splitlines()
@@ -399,7 +427,7 @@ def _add_torrent_magnet(result):
                                "params": [result['url'], {}],
                                "id": 2})
        response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-            verify=deluge_verify_cert)
+            verify=deluge_verify_cert, headers=headers)
        result['hash'] = json.loads(response.text)['result']
        logger.debug('Deluge: Response was %s' % str(json.loads(response.text)))
        return json.loads(response.text)['result']
@@ -419,7 +447,7 @@ def _add_torrent_url(result):
                                "params": [result['url'], {}],
                                "id": 32})
        response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-            verify=deluge_verify_cert)
+            verify=deluge_verify_cert, headers=headers)
        result['location'] = json.loads(response.text)['result']
        logger.debug('Deluge: Response was %s' % str(json.loads(response.text)))
        return json.loads(response.text)['result']
@@ -440,7 +468,7 @@ def _add_torrent_file(result):
                                "params": [result['name'] + '.torrent', b64encode(result['content'].encode('utf8')), {}],
                                "id": 2})
        response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-            verify=deluge_verify_cert)
+            verify=deluge_verify_cert, headers=headers)
        result['hash'] = json.loads(response.text)['result']
        logger.debug('Deluge: Response was %s' % str(json.loads(response.text)))
        return json.loads(response.text)['result']
@@ -453,7 +481,7 @@ def _add_torrent_file(result):
                                    "params": [result['name'] + '.torrent', b64encode(result['content']), {}],
                                    "id": 22})
            response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-                verify=deluge_verify_cert)
+                verify=deluge_verify_cert, headers=headers)
            result['hash'] = json.loads(response.text)['result']
            logger.debug('Deluge: Response was %s' % str(json.loads(response.text)))
            return json.loads(response.text)['result']
@@ -485,7 +513,7 @@ def setTorrentLabel(result):
                                "params": [],
                                "id": 3})
        response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-            verify=deluge_verify_cert)
+            verify=deluge_verify_cert, headers=headers)
        labels = json.loads(response.text)['result']

        if labels is not None:
@@ -496,7 +524,7 @@ def setTorrentLabel(result):
                                            "params": [label],
                                            "id": 4})
                    response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-                        verify=deluge_verify_cert)
+                        verify=deluge_verify_cert, headers=headers)
                    logger.debug('Deluge: %s label added to Deluge' % label)
                except Exception as e:
                    logger.error('Deluge: Setting label failed: %s' % str(e))
@@ -508,7 +536,7 @@ def setTorrentLabel(result):
                                    "params": [result['hash'], label],
                                    "id": 5})
            response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-                verify=deluge_verify_cert)
+                verify=deluge_verify_cert, headers=headers)
            logger.debug('Deluge: %s label added to torrent' % label)
        else:
            logger.debug('Deluge: Label plugin not detected')
@@ -532,12 +560,12 @@ def setSeedRatio(result):
                                    "params": [result['hash'], True],
                                    "id": 5})
            response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-                verify=deluge_verify_cert)
+                verify=deluge_verify_cert, headers=headers)
            post_data = json.dumps({"method": "core.set_torrent_stop_ratio",
                                    "params": [result['hash'], float(ratio)],
                                    "id": 6})
            response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-                verify=deluge_verify_cert)
+                verify=deluge_verify_cert, headers=headers)

            return not json.loads(response.text)['error']

@@ -560,7 +588,7 @@ def setTorrentPath(result):
                                    "params": [result['hash'], True],
                                    "id": 7})
            response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-                verify=deluge_verify_cert)
+                verify=deluge_verify_cert, headers=headers)

            if headphones.CONFIG.DELUGE_DONE_DIRECTORY:
                move_to = headphones.CONFIG.DELUGE_DONE_DIRECTORY
@@ -574,7 +602,7 @@ def setTorrentPath(result):
                                    "params": [result['hash'], move_to],
                                    "id": 8})
            response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-                verify=deluge_verify_cert)
+                verify=deluge_verify_cert, headers=headers)

            return not json.loads(response.text)['error']

@@ -597,7 +625,7 @@ def setTorrentPause(result):
                                    "params": [[result['hash']]],
                                    "id": 9})
            response = requests.post(delugeweb_url, data=post_data.encode('utf-8'), cookies=delugeweb_auth,
-                verify=deluge_verify_cert)
+                verify=deluge_verify_cert, headers=headers)

            return not json.loads(response.text)['error']

@@ -623,7 +623,7 @@ def get_downloaded_track_list(albumpath):
    return downloaded_track_list


-def preserve_torrent_directory(albumpath, forced=False):
+def preserve_torrent_directory(albumpath, forced=False, single=False):
    """
    Copy torrent directory to temp headphones_ directory to keep files for seeding.
    """
@@ -639,7 +639,11 @@ def preserve_torrent_directory(albumpath, forced=False):
            headphones.SYS_ENCODING, 'replace'))

    try:
-        prefix = "headphones_" + os.path.basename(os.path.normpath(albumpath)) + "_"
+        file_name = os.path.basename(os.path.normpath(albumpath))
+        if not single:
+            prefix = "headphones_" + file_name + "_"
+        else:
+            prefix = "headphones_" + os.path.splitext(file_name)[0] + "_"
        new_folder = tempfile.mkdtemp(prefix=prefix, dir=tempdir)
    except Exception as e:
        logger.error("Cannot create temp directory: " + tempdir.decode(
@@ -665,7 +669,11 @@ def preserve_torrent_directory(albumpath, forced=False):
    try:
        subdir = os.path.join(new_folder, "headphones")
        logger.info("Copying files to " + subdir.decode(headphones.SYS_ENCODING, 'replace'))
-        shutil.copytree(albumpath, subdir)
+        if not single:
+            shutil.copytree(albumpath, subdir)
+        else:
+            os.makedirs(subdir)
+            shutil.copy(albumpath, subdir)
        # Update the album path with the new location
        return subdir
    except Exception as e:
@@ -28,7 +28,7 @@ from beets.mediafile import MediaFile, FileTypeError, UnreadableFileError
 from beetsplug import lyrics as beetslyrics
 from headphones import notifiers, utorrent, transmission, deluge, qbittorrent
 from headphones import db, albumart, librarysync
-from headphones import logger, helpers, request, mb, music_encoder
+from headphones import logger, helpers, mb, music_encoder
 from headphones import metadata

 postprocessor_lock = threading.Lock()
@@ -43,6 +43,8 @@ def checkFolder():

        for album in snatched:
            if album['FolderName']:
+                folder_name = album['FolderName']
+                single = False
                if album['Kind'] == 'nzb':
                    download_dir = headphones.CONFIG.DOWNLOAD_DIR
                else:
@@ -51,21 +53,29 @@ def checkFolder():
                    else:
                        download_dir = headphones.CONFIG.DOWNLOAD_TORRENT_DIR

-                album_path = os.path.join(download_dir, album['FolderName']).encode(
-                    headphones.SYS_ENCODING, 'replace')
-                logger.debug("Checking if %s exists" % album_path)
+                    # Qbittorrent - get folder from torrent hash
+                    if album['TorrentHash']:
+                        if headphones.CONFIG.TORRENT_DOWNLOADER == 4:
+                            torrent_folder_name, single = qbittorrent.getFolder(album['TorrentHash'])
+                            if torrent_folder_name:
+                                folder_name = torrent_folder_name

-                if os.path.exists(album_path):
-                    logger.info('Found "' + album['FolderName'] + '" in ' + album[
-                        'Kind'] + ' download folder. Verifying....')
-                    verify(album['AlbumID'], album_path, album['Kind'])
+                if folder_name:
+                    album_path = os.path.join(download_dir, folder_name).encode(
+                        headphones.SYS_ENCODING, 'replace')
+                    logger.debug("Checking if %s exists" % album_path)
+
+                    if os.path.exists(album_path):
+                        logger.info('Found "' + folder_name + '" in ' + album[
+                            'Kind'] + ' download folder. Verifying....')
+                        verify(album['AlbumID'], album_path, album['Kind'], single=single)
            else:
                logger.info("No folder name found for " + album['Title'])

    logger.debug("Checking download folder finished.")


-def verify(albumid, albumpath, Kind=None, forced=False, keep_original_folder=False):
+def verify(albumid, albumpath, Kind=None, forced=False, keep_original_folder=False, single=False):
    myDB = db.DBConnection()
    release = myDB.action('SELECT * from albums WHERE AlbumID=?', [albumid]).fetchone()
    tracks = myDB.select('SELECT * from tracks WHERE AlbumID=?', [albumid])
@@ -206,6 +216,10 @@ def verify(albumid, albumpath, Kind=None, forced=False, keep_original_folder=Fal
                                                                       'replace') + " isn't complete yet. Will try again on the next run")
                return

+    # Force single file through
+    if single and not downloaded_track_list:
+        downloaded_track_list.append(albumpath)
+
    # Check to see if we're preserving the torrent dir
    if (headphones.CONFIG.KEEP_TORRENT_FILES and Kind == "torrent") or headphones.CONFIG.KEEP_ORIGINAL_FOLDER:
        keep_original_folder = True
@@ -263,7 +277,7 @@ def verify(albumid, albumpath, Kind=None, forced=False, keep_original_folder=Fal

        if metaartist == dbartist and metaalbum == dbalbum:
            doPostProcessing(albumid, albumpath, release, tracks, downloaded_track_list, Kind,
-                             keep_original_folder, forced)
+                             keep_original_folder, forced, single)
            return

    # test #2: filenames
@@ -282,7 +296,7 @@ def verify(albumid, albumpath, Kind=None, forced=False, keep_original_folder=Fal

            if dbtrack in filetrack:
                doPostProcessing(albumid, albumpath, release, tracks, downloaded_track_list, Kind,
-                                 keep_original_folder, forced)
+                                 keep_original_folder, forced, single)
                return

    # test #3: number of songs and duration
@@ -315,7 +329,7 @@ def verify(albumid, albumpath, Kind=None, forced=False, keep_original_folder=Fal
            delta = abs(downloaded_track_duration - db_track_duration)
            if delta < 240:
                doPostProcessing(albumid, albumpath, release, tracks, downloaded_track_list, Kind,
-                                 keep_original_folder, forced)
+                                 keep_original_folder, forced, single)
                return

    logger.warn(u'Could not identify album: %s. It may not be the intended album.',
@@ -337,13 +351,13 @@ def markAsUnprocessed(albumid, albumpath, keep_original_folder=False):


 def doPostProcessing(albumid, albumpath, release, tracks, downloaded_track_list, Kind=None,
-                     keep_original_folder=False, forced=False):
+                     keep_original_folder=False, forced=False, single=False):
    logger.info('Starting post-processing for: %s - %s' % (release['ArtistName'], release['AlbumTitle']))
    new_folder = None

    # Preserve the torrent dir
-    if keep_original_folder:
-        temp_path = helpers.preserve_torrent_directory(albumpath, forced)
+    if keep_original_folder or single:
+        temp_path = helpers.preserve_torrent_directory(albumpath, forced, single)
        if not temp_path:
            markAsUnprocessed(albumid, albumpath, keep_original_folder)
            return
@@ -375,7 +389,8 @@ def doPostProcessing(albumid, albumpath, release, tracks, downloaded_track_list,
                         downloaded_track.decode(headphones.SYS_ENCODING, "replace"))
            return
        except IOError:
-            logger.error("Unable to find media file: %s. Not continuing.")
+            logger.error("Unable to find media file: %s. Not continuing.", downloaded_track.decode(
+                headphones.SYS_ENCODING, "replace"))
            if new_folder:
                shutil.rmtree(new_folder)
            return
@@ -410,21 +425,13 @@ def doPostProcessing(albumid, albumpath, release, tracks, downloaded_track_list,
                shutil.rmtree(new_folder)
            return

+    # get artwork and path
+    album_art_path = None
    artwork = None
-    album_art_path = albumart.getAlbumArt(albumid)
-    if headphones.CONFIG.EMBED_ALBUM_ART or headphones.CONFIG.ADD_ALBUM_ART:
-
-        if album_art_path:
-            artwork = request.request_content(album_art_path)
-        else:
-            artwork = None
-
-        if not album_art_path or not artwork or len(artwork) < 100:
-            logger.info("No suitable album art found from Amazon. Checking Last.FM....")
-            artwork = albumart.getCachedArt(albumid)
-            if not artwork or len(artwork) < 100:
-                artwork = False
-                logger.info("No suitable album art found from Last.FM. Not adding album art")
+    if headphones.CONFIG.EMBED_ALBUM_ART or headphones.CONFIG.ADD_ALBUM_ART or \
+            (headphones.CONFIG.PLEX_ENABLED and headphones.CONFIG.PLEX_NOTIFY) or \
+            (headphones.CONFIG.XBMC_ENABLED and headphones.CONFIG.XBMC_NOTIFY):
+        album_art_path, artwork = albumart.getAlbumArt(albumid)

    if headphones.CONFIG.EMBED_ALBUM_ART and artwork:
        embedAlbumArt(artwork, downloaded_track_list)
@@ -474,7 +481,7 @@ def doPostProcessing(albumid, albumpath, release, tracks, downloaded_track_list,
            'SELECT * from snatched WHERE Status="Seed_Snatched" and AlbumID=?',
            [albumid]).fetchone()
        if seed_snatched:
-            hash = seed_snatched['FolderName']
+            hash = seed_snatched['TorrentHash']
            torrent_removed = False
            logger.info(u'%s - %s. Checking if torrent has finished seeding and can be removed' % (
                release['ArtistName'], release['AlbumTitle']))
@@ -944,11 +951,13 @@ def correctMetadata(albumid, release, downloaded_track_list):
            continue

        try:
-            cur_artist, cur_album, candidates, rec = autotag.tag_album(items,
-                                                                       search_artist=helpers.latinToAscii(
-                                                                           release['ArtistName']),
-                                                                       search_album=helpers.latinToAscii(
-                                                                           release['AlbumTitle']))
+            cur_artist, cur_album, prop = autotag.tag_album(items,
+                                                            search_artist=helpers.latinToAscii(
+                                                                release['ArtistName']),
+                                                            search_album=helpers.latinToAscii(
+                                                                release['AlbumTitle']))
+            candidates = prop.candidates
+            rec = prop.recommendation
        except Exception as e:
            logger.error('Error getting recommendation: %s. Not writing metadata', e)
            return False
@@ -17,11 +17,11 @@ import urllib
 import urllib2
 import cookielib
 import json
-import os
 import time
 import mimetypes
 import random
 import string
+import os

 import headphones

@@ -198,37 +198,45 @@ def addFile(data):
    return qbclient._command('command/upload', filelist=files)


-def getFolder(hash):
-    logger.debug('getFolder(%s)' % hash)
+def getName(hash):
+    logger.debug('getName(%s)' % hash)

    qbclient = qbittorrentclient()

-    # Get Active Directory from settings
-    settings = qbclient._get_settings()
-    active_dir = settings['temp_path']
+    tries = 1
+    while tries <= 6:
+        time.sleep(10)
+        status, torrentlist = qbclient._get_list()
+        for torrent in torrentlist:
+            if torrent['hash'].lower() == hash.lower():
+                return torrent['name']
+        tries += 1

-    if not active_dir:
-        logger.error('Could not get "Keep incomplete torrents in:" directory from QBitTorrent settings, please ensure it is set')
-        return None
+    return None

-    # Get Torrent Folder Name
-    torrent_folder = qbclient.get_savepath(hash)

-    # If there's no folder yet then it's probably a magnet, try until folder is populated
-    if torrent_folder == active_dir or not torrent_folder:
-        tries = 1
-        while (torrent_folder == active_dir or torrent_folder is None) and tries <= 10:
-            tries += 1
-            time.sleep(6)
-            torrent_folder = qbclient.get_savepath(hash)
+def getFolder(hash):
+    logger.debug('getFolder(%s)' % hash)

-    if torrent_folder == active_dir or not torrent_folder:
-        torrent_folder = qbclient.get_savepath(hash)
-        return torrent_folder
-    else:
-        if headphones.SYS_PLATFORM != "win32":
-            torrent_folder = torrent_folder.replace('\\', '/')
-        return os.path.basename(os.path.normpath(torrent_folder))
+    torrent_folder = None
+    single_file = False
+
+    qbclient = qbittorrentclient()
+
+    try:
+        status, torrent_files = qbclient.getfiles(hash.lower())
+        if torrent_files:
+            if len(torrent_files) == 1:
+                torrent_folder = torrent_files[0]['name']
+                single_file = True
+            else:
+                torrent_folder = os.path.split(torrent_files[0]['name'])[0]
+                single_file = False
+    except:
+        torrent_folder = None
+        single_file = False
+
+    return torrent_folder, single_file


 _BOUNDARY_CHARS = string.digits + string.ascii_letters
@@ -6,6 +6,7 @@ from urlparse import urlparse
 import re

 import requests as requests
+# from requests.auth import HTTPDigestAuth
 from bs4 import BeautifulSoup

 import headphones
@@ -216,3 +217,37 @@ class Rutracker(object):
            self.session.post(url, params={'action': 'add-file'}, files=files)
        except Exception as e:
            logger.exception('Error adding file to utorrent %s', e)
+
+    # TODO get this working in qbittorrent.py
+    def qbittorrent_add_file(self, data):
+        host = headphones.CONFIG.QBITTORRENT_HOST
+        if not host.startswith('http'):
+            host = 'http://' + host
+        if host.endswith('/'):
+            host = host[:-1]
+        if host.endswith('/gui'):
+            host = host[:-4]
+        base_url = host
+
+        # self.session.auth = HTTPDigestAuth(headphones.CONFIG.QBITTORRENT_USERNAME, headphones.CONFIG.QBITTORRENT_PASSWORD)
+
+        url = base_url + '/login'
+        try:
+            self.session.post(url, data={'username': headphones.CONFIG.QBITTORRENT_USERNAME,
+                                         'password': headphones.CONFIG.QBITTORRENT_PASSWORD})
+        except Exception as e:
+            logger.exception('Error adding file to qbittorrent %s', e)
+            return
+
+        url = base_url + '/command/upload'
+
+        args = {'savepath': headphones.CONFIG.DOWNLOAD_TORRENT_DIR}
+        if headphones.CONFIG.QBITTORRENT_LABEL:
+            args['category'] = headphones.CONFIG.QBITTORRENT_LABEL
+
+        torrent_files = {'torrents': data}
+
+        try:
+            self.session.post(url, data=args, files=torrent_files)
+        except Exception as e:
+            logger.exception('Error adding file to qbittorrent %s', e)
@@ -47,9 +47,9 @@ TORRENT_TO_MAGNET_SERVICES = [

 # Persistent Apollo.rip API object
 apolloobj = None
-# Persistent PTH API object
 ruobj = None
-pthobj = None
+# Persistent RED API object
+redobj = None


 def fix_url(s, charset="utf-8"):
@@ -164,8 +164,8 @@ def get_seed_ratio(provider):
        seed_ratio = headphones.CONFIG.KAT_RATIO
    elif provider == 'Apollo.rip':
        seed_ratio = headphones.CONFIG.APOLLO_RATIO
-    elif provider == 'PassTheHeadphones.Me':
-        seed_ratio = headphones.CONFIG.PTH_RATIO
+    elif provider == 'Redacted':
+        seed_ratio = headphones.CONFIG.REDACTED_RATIO
    elif provider == 'The Pirate Bay':
        seed_ratio = headphones.CONFIG.PIRATEBAY_RATIO
    elif provider == 'Old Pirate Bay':
@@ -277,7 +277,7 @@ def do_sorted_search(album, new, losslessOnly, choose_specific_download=False):
                         headphones.CONFIG.WAFFLES or
                         headphones.CONFIG.RUTRACKER or
                         headphones.CONFIG.APOLLO or
-                         headphones.CONFIG.PTH or
+                         headphones.CONFIG.REDACTED or
                         headphones.CONFIG.STRIKE or
                         headphones.CONFIG.TQUATTRECENTONZE)

@@ -1018,36 +1018,37 @@ def send_to_downloader(data, bestqual, album):

            # Add torrent
            if bestqual[3] == 'rutracker.org':
-                qbittorrent.addFile(data)
+                ruobj.qbittorrent_add_file(data)
            else:
                qbittorrent.addTorrent(bestqual[2])

            # Get hash
            torrentid = calculate_torrent_hash(bestqual[2], data)
+            torrentid = torrentid.lower()
            if not torrentid:
                logger.error('Torrent id could not be determined')
                return

-            # Get folder
-            folder_name = qbittorrent.getFolder(torrentid)
+            # Get name
+            folder_name = qbittorrent.getName(torrentid)
            if folder_name:
-                logger.info('Torrent folder name: %s' % folder_name)
+                logger.info('Torrent name: %s' % folder_name)
            else:
-                logger.error('Torrent folder name could not be determined')
+                logger.error('Torrent name could not be determined')
                return

    myDB = db.DBConnection()
    myDB.action('UPDATE albums SET status = "Snatched" WHERE AlbumID=?', [album['AlbumID']])
-    myDB.action('INSERT INTO snatched VALUES( ?, ?, ?, ?, DATETIME("NOW", "localtime"), ?, ?, ?)',
+    myDB.action('INSERT INTO snatched VALUES( ?, ?, ?, ?, DATETIME("NOW", "localtime"), ?, ?, ?, ?)',
                [album['AlbumID'], bestqual[0], bestqual[1], bestqual[2], "Snatched", folder_name,
-                 kind])
+                 kind, torrentid])

    # Store the torrent id so we can check later if it's finished seeding and can be removed
    if seed_ratio is not None and seed_ratio != 0 and torrentid:
        myDB.action(
-            'INSERT INTO snatched VALUES( ?, ?, ?, ?, DATETIME("NOW", "localtime"), ?, ?, ?)',
-            [album['AlbumID'], bestqual[0], bestqual[1], bestqual[2], "Seed_Snatched", torrentid,
-             kind])
+            'INSERT INTO snatched VALUES( ?, ?, ?, ?, DATETIME("NOW", "localtime"), ?, ?, ?, ?)',
+            [album['AlbumID'], bestqual[0], bestqual[1], bestqual[2], "Seed_Snatched", folder_name,
+             kind, torrentid])

    # notify
    artist = album[1]
@@ -1206,7 +1207,7 @@ def verifyresult(title, artistterm, term, lossless):
 def searchTorrent(album, new=False, losslessOnly=False, albumlength=None,
                  choose_specific_download=False):
    global apolloobj  # persistent apollo.rip api object to reduce number of login attempts
-    global pthobj  # persistent pth api object to reduce number of login attempts
+    global redobj  # persistent redacted api object to reduce number of login attempts
    global ruobj  # and rutracker

    reldate = album['ReleaseDate']
@@ -1436,8 +1437,9 @@ def searchTorrent(album, new=False, losslessOnly=False, albumlength=None,
            query_items = [usersearchterm]

        query_items.extend(['format:(%s)' % format,
-                            'size:[0 TO %d]' % maxsize,
-                            '-seeders:0'])  # cut out dead torrents
+                            'size:[0 TO %d]' % maxsize])
+        # (25/03/2017 Waffles back up after 5 months, all torrents currently have no seeders, remove for now)
+        # '-seeders:0'])  cut out dead torrents

        if bitrate:
            query_items.append('bitrate:"%s"' % bitrate)
@@ -1612,10 +1614,10 @@ def searchTorrent(album, new=False, losslessOnly=False, albumlength=None,
                                   provider,
                                   'torrent', True))

-    # PassTheHeadphones.me - Using same logic as What.CD as it's also Gazelle, so should really make this into something reusable
-    if headphones.CONFIG.PTH:
-        provider = "PassTheHeadphones.me"
-        providerurl = "https://passtheheadphones.me/"
+    # Redacted - Using same logic as What.CD as it's also Gazelle, so should really make this into something reusable
+    if headphones.CONFIG.REDACTED:
+        provider = "Redacted"
+        providerurl = "https://redacted.ch"

        bitrate = None
        bitrate_string = bitrate
@@ -1638,7 +1640,7 @@ def searchTorrent(album, new=False, losslessOnly=False, albumlength=None,
                        bitrate_string = encoding_string
                if bitrate_string not in gazelleencoding.ALL_ENCODINGS:
                    logger.info(
-                        u"Your preferred bitrate is not one of the available PTH filters, so not using it as a search parameter.")
+                        u"Your preferred bitrate is not one of the available RED filters, so not using it as a search parameter.")
            maxsize = 10000000000
        elif headphones.CONFIG.PREFERRED_QUALITY == 1 or allow_lossless:  # Highest quality including lossless
            search_formats = [gazelleformat.FLAC, gazelleformat.MP3]
@@ -1647,28 +1649,28 @@ def searchTorrent(album, new=False, losslessOnly=False, albumlength=None,
            search_formats = [gazelleformat.MP3]
            maxsize = 300000000

-        if not pthobj or not pthobj.logged_in():
+        if not redobj or not redobj.logged_in():
            try:
-                logger.info(u"Attempting to log in to PassTheHeadphones.me...")
-                pthobj = gazelleapi.GazelleAPI(headphones.CONFIG.PTH_USERNAME,
-                                                headphones.CONFIG.PTH_PASSWORD,
-                                                headphones.CONFIG.PTH_URL)
-                pthobj._login()
+                logger.info(u"Attempting to log in to Redacted...")
+                redobj = gazelleapi.GazelleAPI(headphones.CONFIG.REDACTED_USERNAME,
+                                                headphones.CONFIG.REDACTED_PASSWORD,
+                                                providerurl)
+                redobj._login()
            except Exception as e:
-                pthobj = None
-                logger.error(u"PassTheHeadphones credentials incorrect or site is down. Error: %s %s" % (
+                redobj = None
+                logger.error(u"Redacted credentials incorrect or site is down. Error: %s %s" % (
                    e.__class__.__name__, str(e)))

-        if pthobj and pthobj.logged_in():
+        if redobj and redobj.logged_in():
            logger.info(u"Searching %s..." % provider)
            all_torrents = []
            for search_format in search_formats:
                if usersearchterm:
                    all_torrents.extend(
-                        pthobj.search_torrents(searchstr=usersearchterm, format=search_format,
+                        redobj.search_torrents(searchstr=usersearchterm, format=search_format,
                                                encoding=bitrate_string)['results'])
                else:
-                    all_torrents.extend(pthobj.search_torrents(artistname=semi_clean_artist_term,
+                    all_torrents.extend(redobj.search_torrents(artistname=semi_clean_artist_term,
                                                                groupname=semi_clean_album_term,
                                                                format=search_format,
                                                                encoding=bitrate_string)['results'])
@@ -1708,7 +1710,7 @@ def searchTorrent(album, new=False, losslessOnly=False, albumlength=None,
                    torrent.group.update_group_data()  # will load the file_path for the individual torrents
                resultlist.append((torrent.file_path,
                                   torrent.size,
-                                   pthobj.generate_torrent_link(torrent.id),
+                                   redobj.generate_torrent_link(torrent.id),
                                   provider,
                                   'torrent', True))

@@ -2055,7 +2057,7 @@ def preprocess(resultlist):
                headers['User-Agent'] = USER_AGENT
            elif result[3] == 'Apollo.rip':
                headers['User-Agent'] = 'Headphones'
-            elif result[3] == 'PassTheHeadphones.me':
+            elif result[3] == 'Redacted':
                headers['User-Agent'] = 'Headphones'
            elif result[3] == "The Pirate Bay" or result[3] == "Old Pirate Bay":
                headers[
@@ -13,13 +13,10 @@
 #  You should have received a copy of the GNU General Public License
 #  along with Headphones.  If not, see <http://www.gnu.org/licenses/>.

-import threading

-from headphones import db, utorrent, transmission, logger
+from headphones import db, utorrent, transmission, deluge, qbittorrent, logger
 import headphones

-postprocessor_lock = threading.Lock()
-

 def checkTorrentFinished():
    """
@@ -28,21 +25,25 @@ def checkTorrentFinished():

    logger.info("Checking if any torrents have finished seeding and can be removed")

-    with postprocessor_lock:
-        myDB = db.DBConnection()
-        results = myDB.select('SELECT * from snatched WHERE Status="Seed_Processed"')
+    myDB = db.DBConnection()
+    results = myDB.select('SELECT * from snatched WHERE Status="Seed_Processed"')

-        for album in results:
-            hash = album['FolderName']
-            albumid = album['AlbumID']
-            torrent_removed = False
-            if headphones.CONFIG.TORRENT_DOWNLOADER == 1:
-                torrent_removed = transmission.removeTorrent(hash, True)
-            else:
-                torrent_removed = utorrent.removeTorrent(hash, True)
+    for album in results:
+        hash = album['TorrentHash']
+        albumid = album['AlbumID']
+        torrent_removed = False

-            if torrent_removed:
-                myDB.action('DELETE from snatched WHERE status = "Seed_Processed" and AlbumID=?',
-                            [albumid])
+        if headphones.CONFIG.TORRENT_DOWNLOADER == 1:
+            torrent_removed = transmission.removeTorrent(hash, True)
+        elif headphones.CONFIG.TORRENT_DOWNLOADER == 2:
+            torrent_removed = utorrent.removeTorrent(hash, True)
+        elif headphones.CONFIG.TORRENT_DOWNLOADER == 3:
+            torrent_removed = deluge.removeTorrent(hash, True)
+        else:
+            torrent_removed = qbittorrent.removeTorrent(hash, True)
+
+        if torrent_removed:
+            myDB.action('DELETE from snatched WHERE status = "Seed_Processed" and AlbumID=?',
+                        [albumid])

    logger.info("Checking finished torrents completed")
@@ -1234,11 +1234,10 @@ class WebInterface(object):
            "apollo_password": headphones.CONFIG.APOLLO_PASSWORD,
            "apollo_ratio": headphones.CONFIG.APOLLO_RATIO,
            "apollo_url": headphones.CONFIG.APOLLO_URL,
-            "use_pth": checked(headphones.CONFIG.PTH),
-            "pth_username": headphones.CONFIG.PTH_USERNAME,
-            "pth_password": headphones.CONFIG.PTH_PASSWORD,
-            "pth_ratio": headphones.CONFIG.PTH_RATIO,
-            "pth_url": headphones.CONFIG.PTH_URL,
+            "use_redacted": checked(headphones.CONFIG.REDACTED),
+            "redacted_username": headphones.CONFIG.REDACTED_USERNAME,
+            "redacted_password": headphones.CONFIG.REDACTED_PASSWORD,
+            "redacted_ratio": headphones.CONFIG.REDACTED_RATIO,
            "use_strike": checked(headphones.CONFIG.STRIKE),
            "strike_ratio": headphones.CONFIG.STRIKE_RATIO,
            "use_tquattrecentonze": checked(headphones.CONFIG.TQUATTRECENTONZE),
@@ -1267,6 +1266,8 @@ class WebInterface(object):
            "keep_nfo": checked(headphones.CONFIG.KEEP_NFO),
            "add_album_art": checked(headphones.CONFIG.ADD_ALBUM_ART),
            "album_art_format": headphones.CONFIG.ALBUM_ART_FORMAT,
+            "album_art_min_width": headphones.CONFIG.ALBUM_ART_MIN_WIDTH,
+            "album_art_max_width": headphones.CONFIG.ALBUM_ART_MAX_WIDTH,
            "embed_album_art": checked(headphones.CONFIG.EMBED_ALBUM_ART),
            "embed_lyrics": checked(headphones.CONFIG.EMBED_LYRICS),
            "replace_existing_folders": checked(headphones.CONFIG.REPLACE_EXISTING_FOLDERS),
@@ -1,21 +0,0 @@
-The MIT License
-
-Copyright (c) 2010-2014 Adrian Sampson
-
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-
-The above copyright notice and this permission notice shall be included in
-all copies or substantial portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
-THE SOFTWARE.
@@ -1,94 +0,0 @@
-.. image:: https://travis-ci.org/sampsyo/beets.svg?branch=master
-    :target: https://travis-ci.org/sampsyo/beets
-
-.. image:: http://img.shields.io/coveralls/sampsyo/beets.svg
-    :target: https://coveralls.io/r/sampsyo/beets
-
-.. image:: http://img.shields.io/pypi/v/beets.svg
-    :target: https://pypi.python.org/pypi/beets
-
-Beets is the media library management system for obsessive-compulsive music
-geeks.
-
-The purpose of beets is to get your music collection right once and for all.
-It catalogs your collection, automatically improving its metadata as it goes.
-It then provides a bouquet of tools for manipulating and accessing your music.
-
-Here's an example of beets' brainy tag corrector doing its thing::
-
-  $ beet import ~/music/ladytron
-  Tagging:
-      Ladytron - Witching Hour
-  (Similarity: 98.4%)
-   * Last One Standing      -> The Last One Standing
-   * Beauty                 -> Beauty*2
-   * White Light Generation -> Whitelightgenerator
-   * All the Way            -> All the Way...
-
-Because beets is designed as a library, it can do almost anything you can
-imagine for your music collection. Via `plugins`_, beets becomes a panacea:
-
- Fetch or calculate all the metadata you could possibly need: `album art`_,
-  `lyrics`_, `genres`_, `tempos`_, `ReplayGain`_ levels, or `acoustic
-  fingerprints`_.
- Get metadata from `MusicBrainz`_, `Discogs`_, or `Beatport`_. Or guess
-  metadata using songs' filenames or their acoustic fingerprints.
- `Transcode audio`_ to any format you like.
- Check your library for `duplicate tracks and albums`_ or for `albums that
-  are missing tracks`_.
- Clean up crufty tags left behind by other, less-awesome tools.
- Embed and extract album art from files' metadata.
- Browse your music library graphically through a Web browser and play it in any
-  browser that supports `HTML5 Audio`_.
- Analyze music files' metadata from the command line.
- Listen to your library with a music player that speaks the `MPD`_ protocol
-  and works with a staggering variety of interfaces.
-
-If beets doesn't do what you want yet, `writing your own plugin`_ is
-shockingly simple if you know a little Python.
-
-.. _plugins: http://beets.readthedocs.org/page/plugins/
-.. _MPD: http://www.musicpd.org/
-.. _MusicBrainz music collection: http://musicbrainz.org/doc/Collections/
-.. _writing your own plugin:
-    http://beets.readthedocs.org/page/dev/plugins.html
-.. _HTML5 Audio:
-    http://www.w3.org/TR/html-markup/audio.html
-.. _albums that are missing tracks:
-    http://beets.readthedocs.org/page/plugins/missing.html
-.. _duplicate tracks and albums:
-    http://beets.readthedocs.org/page/plugins/duplicates.html
-.. _Transcode audio:
-    http://beets.readthedocs.org/page/plugins/convert.html
-.. _Beatport: http://www.beatport.com/
-.. _Discogs: http://www.discogs.com/
-.. _acoustic fingerprints:
-    http://beets.readthedocs.org/page/plugins/chroma.html
-.. _ReplayGain: http://beets.readthedocs.org/page/plugins/replaygain.html
-.. _tempos: http://beets.readthedocs.org/page/plugins/echonest.html
-.. _genres: http://beets.readthedocs.org/page/plugins/lastgenre.html
-.. _album art: http://beets.readthedocs.org/page/plugins/fetchart.html
-.. _lyrics: http://beets.readthedocs.org/page/plugins/lyrics.html
-.. _MusicBrainz: http://musicbrainz.org/
-
-Read More
---------
-
-Learn more about beets at `its Web site`_. Follow `@b33ts`_ on Twitter for
-news and updates.
-
-You can install beets by typing ``pip install beets``. Then check out the
-`Getting Started`_ guide.
-
-.. _its Web site: http://beets.radbox.org/
-.. _Getting Started: http://beets.readthedocs.org/page/guides/main.html
-.. _@b33ts: http://twitter.com/b33ts/
-
-Authors
-------
-
-Beets is by `Adrian Sampson`_ with a supporting cast of thousands. For help,
-please contact the `mailing list`_.
-
-.. _mailing list: https://groups.google.com/forum/#!forum/beets-users
-.. _Adrian Sampson: http://homes.cs.washington.edu/~asampson/
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2014, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -12,17 +13,33 @@
 # The above copyright notice and this permission notice shall be
 # included in all copies or substantial portions of the Software.

-# This particular version has been slightly modified to work with Headphones
-# https://github.com/rembo10/headphones
-
-__version__ = '1.3.10-headphones'
-__author__ = 'Adrian Sampson <adrian@radbox.org>'
+from __future__ import division, absolute_import, print_function

 import os

-import beets.library
 from beets.util import confit

-Library = beets.library.Library
+# This particular version has been slightly modified to work with Headphones
+# https://github.com/rembo10/headphones
+__version__ = u'1.4.4-headphones'
+__author__ = u'Adrian Sampson <adrian@radbox.org>'

-config = confit.LazyConfig(os.path.dirname(__file__), __name__)
+
+class IncludeLazyConfig(confit.LazyConfig):
+    """A version of Confit's LazyConfig that also merges in data from
+    YAML files specified in an `include` setting.
+    """
+    def read(self, user=True, defaults=True):
+        super(IncludeLazyConfig, self).read(user, defaults)
+
+        try:
+            for view in self['include']:
+                filename = view.as_filename()
+                if os.path.isfile(filename):
+                    self.set_file(filename)
+        except confit.NotFoundError:
+            pass
+
+# headphones
+#config = IncludeLazyConfig('beets', __name__)
+config = IncludeLazyConfig(os.path.dirname(__file__), __name__)
@@ -0,0 +1,26 @@
+# -*- coding: utf-8 -*-
+# This file is part of beets.
+# Copyright 2017, Adrian Sampson.
+#
+# Permission is hereby granted, free of charge, to any person obtaining
+# a copy of this software and associated documentation files (the
+# "Software"), to deal in the Software without restriction, including
+# without limitation the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the Software, and to
+# permit persons to whom the Software is furnished to do so, subject to
+# the following conditions:
+#
+# The above copyright notice and this permission notice shall be
+# included in all copies or substantial portions of the Software.
+
+"""The __main__ module lets you run the beets CLI interface by typing
+`python -m beets`.
+"""
+
+from __future__ import division, absolute_import, print_function
+
+import sys
+from .ui import main
+
+if __name__ == "__main__":
+    main(sys.argv[1:])
@@ -0,0 +1,222 @@
+# -*- coding: utf-8 -*-
+# This file is part of beets.
+# Copyright 2016, Adrian Sampson.
+#
+# Permission is hereby granted, free of charge, to any person obtaining
+# a copy of this software and associated documentation files (the
+# "Software"), to deal in the Software without restriction, including
+# without limitation the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the Software, and to
+# permit persons to whom the Software is furnished to do so, subject to
+# the following conditions:
+#
+# The above copyright notice and this permission notice shall be
+# included in all copies or substantial portions of the Software.
+
+"""High-level utilities for manipulating image files associated with
+music and items' embedded album art.
+"""
+
+from __future__ import division, absolute_import, print_function
+
+import subprocess
+import platform
+from tempfile import NamedTemporaryFile
+import os
+
+from beets.util import displayable_path, syspath, bytestring_path
+from beets.util.artresizer import ArtResizer
+from beets import mediafile
+
+
+def mediafile_image(image_path, maxwidth=None):
+    """Return a `mediafile.Image` object for the path.
+    """
+
+    with open(syspath(image_path), 'rb') as f:
+        data = f.read()
+    return mediafile.Image(data, type=mediafile.ImageType.front)
+
+
+def get_art(log, item):
+    # Extract the art.
+    try:
+        mf = mediafile.MediaFile(syspath(item.path))
+    except mediafile.UnreadableFileError as exc:
+        log.warning(u'Could not extract art from {0}: {1}',
+                    displayable_path(item.path), exc)
+        return
+
+    return mf.art
+
+
+def embed_item(log, item, imagepath, maxwidth=None, itempath=None,
+               compare_threshold=0, ifempty=False, as_album=False):
+    """Embed an image into the item's media file.
+    """
+    # Conditions and filters.
+    if compare_threshold:
+        if not check_art_similarity(log, item, imagepath, compare_threshold):
+            log.info(u'Image not similar; skipping.')
+            return
+    if ifempty and get_art(log, item):
+            log.info(u'media file already contained art')
+            return
+    if maxwidth and not as_album:
+        imagepath = resize_image(log, imagepath, maxwidth)
+
+    # Get the `Image` object from the file.
+    try:
+        log.debug(u'embedding {0}', displayable_path(imagepath))
+        image = mediafile_image(imagepath, maxwidth)
+    except IOError as exc:
+        log.warning(u'could not read image file: {0}', exc)
+        return
+
+    # Make sure the image kind is safe (some formats only support PNG
+    # and JPEG).
+    if image.mime_type not in ('image/jpeg', 'image/png'):
+        log.info('not embedding image of unsupported type: {}',
+                 image.mime_type)
+        return
+
+    item.try_write(path=itempath, tags={'images': [image]})
+
+
+def embed_album(log, album, maxwidth=None, quiet=False,
+                compare_threshold=0, ifempty=False):
+    """Embed album art into all of the album's items.
+    """
+    imagepath = album.artpath
+    if not imagepath:
+        log.info(u'No album art present for {0}', album)
+        return
+    if not os.path.isfile(syspath(imagepath)):
+        log.info(u'Album art not found at {0} for {1}',
+                 displayable_path(imagepath), album)
+        return
+    if maxwidth:
+        imagepath = resize_image(log, imagepath, maxwidth)
+
+    log.info(u'Embedding album art into {0}', album)
+
+    for item in album.items():
+        embed_item(log, item, imagepath, maxwidth, None,
+                   compare_threshold, ifempty, as_album=True)
+
+
+def resize_image(log, imagepath, maxwidth):
+    """Returns path to an image resized to maxwidth.
+    """
+    log.debug(u'Resizing album art to {0} pixels wide', maxwidth)
+    imagepath = ArtResizer.shared.resize(maxwidth, syspath(imagepath))
+    return imagepath
+
+
+def check_art_similarity(log, item, imagepath, compare_threshold):
+    """A boolean indicating if an image is similar to embedded item art.
+    """
+    with NamedTemporaryFile(delete=True) as f:
+        art = extract(log, f.name, item)
+
+        if art:
+            is_windows = platform.system() == "Windows"
+
+            # Converting images to grayscale tends to minimize the weight
+            # of colors in the diff score. So we first convert both images
+            # to grayscale and then pipe them into the `compare` command.
+            # On Windows, ImageMagick doesn't support the magic \\?\ prefix
+            # on paths, so we pass `prefix=False` to `syspath`.
+            convert_cmd = ['convert', syspath(imagepath, prefix=False),
+                           syspath(art, prefix=False),
+                           '-colorspace', 'gray', 'MIFF:-']
+            compare_cmd = ['compare', '-metric', 'PHASH', '-', 'null:']
+            log.debug(u'comparing images with pipeline {} | {}',
+                      convert_cmd, compare_cmd)
+            convert_proc = subprocess.Popen(
+                convert_cmd,
+                stdout=subprocess.PIPE,
+                stderr=subprocess.PIPE,
+                close_fds=not is_windows,
+            )
+            compare_proc = subprocess.Popen(
+                compare_cmd,
+                stdin=convert_proc.stdout,
+                stdout=subprocess.PIPE,
+                stderr=subprocess.PIPE,
+                close_fds=not is_windows,
+            )
+
+            # Check the convert output. We're not interested in the
+            # standard output; that gets piped to the next stage.
+            convert_proc.stdout.close()
+            convert_stderr = convert_proc.stderr.read()
+            convert_proc.stderr.close()
+            convert_proc.wait()
+            if convert_proc.returncode:
+                log.debug(
+                    u'ImageMagick convert failed with status {}: {!r}',
+                    convert_proc.returncode,
+                    convert_stderr,
+                )
+                return
+
+            # Check the compare output.
+            stdout, stderr = compare_proc.communicate()
+            if compare_proc.returncode:
+                if compare_proc.returncode != 1:
+                    log.debug(u'ImageMagick compare failed: {0}, {1}',
+                              displayable_path(imagepath),
+                              displayable_path(art))
+                    return
+                out_str = stderr
+            else:
+                out_str = stdout
+
+            try:
+                phash_diff = float(out_str)
+            except ValueError:
+                log.debug(u'IM output is not a number: {0!r}', out_str)
+                return
+
+            log.debug(u'ImageMagick compare score: {0}', phash_diff)
+            return phash_diff <= compare_threshold
+
+    return True
+
+
+def extract(log, outpath, item):
+    art = get_art(log, item)
+    outpath = bytestring_path(outpath)
+    if not art:
+        log.info(u'No album art present in {0}, skipping.', item)
+        return
+
+    # Add an extension to the filename.
+    ext = mediafile.image_extension(art)
+    if not ext:
+        log.warning(u'Unknown image type in {0}.',
+                    displayable_path(item.path))
+        return
+    outpath += bytestring_path('.' + ext)
+
+    log.info(u'Extracting album art from: {0} to: {1}',
+             item, displayable_path(outpath))
+    with open(syspath(outpath), 'wb') as f:
+        f.write(art)
+    return outpath
+
+
+def extract_first(log, outpath, items):
+    for item in items:
+        real_path = extract(log, outpath, item)
+        if real_path:
+            return real_path
+
+
+def clear(log, lib, query):
+    items = lib.items(query)
+    log.info(u'Clearing album art from {0} items', len(items))
+    for item in items:
+        log.debug(u'Clearing art for {0}', item)
+        item.try_write(tags={'images': None})
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2013, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -14,13 +15,15 @@

 """Facilities for automatically determining files' correct metadata.
 """
-import logging

+from __future__ import division, absolute_import, print_function
+
+from beets import logging
 from beets import config

 # Parts of external interface.
 from .hooks import AlbumInfo, TrackInfo, AlbumMatch, TrackMatch  # noqa
-from .match import tag_item, tag_album  # noqa
+from .match import tag_item, tag_album, Proposal  # noqa
 from .match import Recommendation  # noqa

 # Global logger.
@@ -39,6 +42,16 @@ def apply_item_metadata(item, track_info):
    item.mb_trackid = track_info.track_id
    if track_info.artist_id:
        item.mb_artistid = track_info.artist_id
+    if track_info.data_source:
+        item.data_source = track_info.data_source
+
+    if track_info.lyricist is not None:
+        item.lyricist = track_info.lyricist
+    if track_info.composer is not None:
+        item.composer = track_info.composer
+    if track_info.arranger is not None:
+        item.arranger = track_info.arranger
+
    # At the moment, the other metadata is left intact (including album
    # and track number). Perhaps these should be emptied?

@@ -47,7 +60,7 @@ def apply_metadata(album_info, mapping):
    """Set the items' metadata to match an AlbumInfo object using a
    mapping from Items to TrackInfo objects.
    """
-    for item, track_info in mapping.iteritems():
+    for item, track_info in mapping.items():
        # Album, artist, track count.
        if track_info.artist:
            item.artist = track_info.artist
@@ -90,7 +103,12 @@ def apply_metadata(album_info, mapping):
        item.title = track_info.title

        if config['per_disc_numbering']:
-            item.track = track_info.medium_index or track_info.index
+            # We want to let the track number be zero, but if the medium index
+            # is not provided we need to fall back to the overall index.
+            if track_info.medium_index is not None:
+                item.track = track_info.medium_index
+            else:
+                item.track = track_info.index
            item.tracktotal = track_info.medium_total or len(album_info.tracks)
        else:
            item.track = track_info.index
@@ -122,7 +140,8 @@ def apply_metadata(album_info, mapping):
                      'language',
                      'country',
                      'albumstatus',
-                      'albumdisambig'):
+                      'albumdisambig',
+                      'data_source',):
            value = getattr(album_info, field)
            if value is not None:
                item[field] = value
@@ -132,5 +151,14 @@ def apply_metadata(album_info, mapping):
        if track_info.media is not None:
            item.media = track_info.media

+        if track_info.lyricist is not None:
+            item.lyricist = track_info.lyricist
+        if track_info.composer is not None:
+            item.composer = track_info.composer
+        if track_info.arranger is not None:
+            item.arranger = track_info.arranger
+
+        item.track_alt = track_info.track_alt
+
        # Headphones seal of approval
-        item.comments = 'tagged by headphones/beets'
+        item.comments = 'tagged by headphones/beets'
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2013, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -13,15 +14,20 @@
 # included in all copies or substantial portions of the Software.

 """Glue between metadata sources and the matching logic."""
-import logging
+from __future__ import division, absolute_import, print_function
+
 from collections import namedtuple
+from functools import total_ordering
 import re

+from beets import logging
 from beets import plugins
 from beets import config
+from beets.util import as_string
 from beets.autotag import mb
-from beets.util import levenshtein
+from jellyfish import levenshtein_distance
 from unidecode import unidecode
+import six

 log = logging.getLogger('beets')

@@ -101,7 +107,7 @@ class AlbumInfo(object):
    # Work around a bug in python-musicbrainz-ngs that causes some
    # strings to be bytes rather than Unicode.
    # https://github.com/alastair/python-musicbrainz-ngs/issues/85
-    def decode(self, codec='utf8'):
+    def decode(self, codec='utf-8'):
        """Ensure that all string attributes on this object, and the
        constituent `TrackInfo` objects, are decoded to Unicode.
        """
@@ -109,7 +115,7 @@ class AlbumInfo(object):
                    'catalognum', 'script', 'language', 'country',
                    'albumstatus', 'albumdisambig', 'artist_credit', 'media']:
            value = getattr(self, fld)
-            if isinstance(value, str):
+            if isinstance(value, bytes):
                setattr(self, fld, value.decode(codec, 'ignore'))

        if self.tracks:
@@ -134,6 +140,12 @@ class TrackInfo(object):
    - ``artist_sort``: name of the track artist for sorting
    - ``disctitle``: name of the individual medium (subtitle)
    - ``artist_credit``: Recording-specific artist name
+    - ``data_source``: The original data source (MusicBrainz, Discogs, etc.)
+    - ``data_url``: The data source release URL.
+    - ``lyricist``: individual track lyricist name
+    - ``composer``: individual track composer name
+    - ``arranger`: individual track arranger name
+    - ``track_alt``: alternative track number (tape, vinyl, etc.)

    Only ``title`` and ``track_id`` are required. The rest of the fields
    may be None. The indices ``index``, ``medium``, and ``medium_index``
@@ -143,7 +155,8 @@ class TrackInfo(object):
                 length=None, index=None, medium=None, medium_index=None,
                 medium_total=None, artist_sort=None, disctitle=None,
                 artist_credit=None, data_source=None, data_url=None,
-                 media=None):
+                 media=None, lyricist=None, composer=None, arranger=None,
+                 track_alt=None):
        self.title = title
        self.track_id = track_id
        self.artist = artist
@@ -159,16 +172,20 @@ class TrackInfo(object):
        self.artist_credit = artist_credit
        self.data_source = data_source
        self.data_url = data_url
+        self.lyricist = lyricist
+        self.composer = composer
+        self.arranger = arranger
+        self.track_alt = track_alt

    # As above, work around a bug in python-musicbrainz-ngs.
-    def decode(self, codec='utf8'):
+    def decode(self, codec='utf-8'):
        """Ensure that all string attributes on this object are decoded
        to Unicode.
        """
        for fld in ['title', 'artist', 'medium', 'artist_sort', 'disctitle',
                    'artist_credit', 'media']:
            value = getattr(self, fld)
-            if isinstance(value, str):
+            if isinstance(value, bytes):
                setattr(self, fld, value.decode(codec, 'ignore'))


@@ -198,13 +215,15 @@ def _string_dist_basic(str1, str2):
    transliteration/lowering to ASCII characters. Normalized by string
    length.
    """
-    str1 = unidecode(str1)
-    str2 = unidecode(str2)
+    assert isinstance(str1, six.text_type)
+    assert isinstance(str2, six.text_type)
+    str1 = as_string(unidecode(str1))
+    str2 = as_string(unidecode(str2))
    str1 = re.sub(r'[^a-z0-9]', '', str1.lower())
    str2 = re.sub(r'[^a-z0-9]', '', str2.lower())
    if not str1 and not str2:
        return 0.0
-    return levenshtein(str1, str2) / float(max(len(str1), len(str2)))
+    return levenshtein_distance(str1, str2) / float(max(len(str1), len(str2)))


 def string_dist(str1, str2):
@@ -281,6 +300,8 @@ class LazyClassProperty(object):
        return self.value


+@total_ordering
+@six.python_2_unicode_compatible
 class Distance(object):
    """Keeps track of multiple distance penalties. Provides a single
    weighted distance for all penalties as well as a weighted distance
@@ -290,7 +311,7 @@ class Distance(object):
        self._penalties = {}

    @LazyClassProperty
-    def _weights(cls):
+    def _weights(cls):  # noqa
        """A dictionary from keys to floating-point weights.
        """
        weights_view = config['match']['distance_weights']
@@ -316,7 +337,7 @@ class Distance(object):
        """Return the maximum distance penalty (normalization factor).
        """
        dist_max = 0.0
-        for key, penalty in self._penalties.iteritems():
+        for key, penalty in self._penalties.items():
            dist_max += len(penalty) * self._weights[key]
        return dist_max

@@ -325,7 +346,7 @@ class Distance(object):
        """Return the raw (denormalized) distance.
        """
        dist_raw = 0.0
-        for key, penalty in self._penalties.iteritems():
+        for key, penalty in self._penalties.items():
            dist_raw += sum(penalty) * self._weights[key]
        return dist_raw

@@ -342,12 +363,21 @@ class Distance(object):
        # Convert distance into a negative float we can sort items in
        # ascending order (for keys, when the penalty is equal) and
        # still get the items with the biggest distance first.
-        return sorted(list_, key=lambda (key, dist): (0 - dist, key))
+        return sorted(
+            list_,
+            key=lambda key_and_dist: (-key_and_dist[1], key_and_dist[0])
+        )
+
+    def __hash__(self):
+        return id(self)
+
+    def __eq__(self, other):
+        return self.distance == other

    # Behave like a float.

-    def __cmp__(self, other):
-        return cmp(self.distance, other)
+    def __lt__(self, other):
+        return self.distance < other

    def __float__(self):
        return self.distance
@@ -358,6 +388,9 @@ class Distance(object):
    def __rsub__(self, other):
        return other - self.distance

+    def __str__(self):
+        return "{0:.2f}".format(self.distance)
+
    # Behave like a dict.

    def __getitem__(self, key):
@@ -383,9 +416,9 @@ class Distance(object):
        """
        if not isinstance(dist, Distance):
            raise ValueError(
-                '`dist` must be a Distance object, not {0}'.format(type(dist))
+                u'`dist` must be a Distance object, not {0}'.format(type(dist))
            )
-        for key, penalties in dist._penalties.iteritems():
+        for key, penalties in dist._penalties.items():
            self._penalties.setdefault(key, []).extend(penalties)

    # Adding components.
@@ -407,7 +440,7 @@ class Distance(object):
        """
        if not 0.0 <= dist <= 1.0:
            raise ValueError(
-                '`dist` must be between 0.0 and 1.0, not {0}'.format(dist)
+                u'`dist` must be between 0.0 and 1.0, not {0}'.format(dist)
            )
        self._penalties.setdefault(key, []).append(dist)

@@ -516,20 +549,29 @@ def track_for_mbid(recording_id):
        exc.log(log)


+@plugins.notify_info_yielded(u'albuminfo_received')
 def albums_for_id(album_id):
    """Get a list of albums for an ID."""
-    candidates = [album_for_mbid(album_id)]
-    candidates.extend(plugins.album_for_id(album_id))
-    return filter(None, candidates)
+    a = album_for_mbid(album_id)
+    if a:
+        yield a
+    for a in plugins.album_for_id(album_id):
+        if a:
+            yield a


+@plugins.notify_info_yielded(u'trackinfo_received')
 def tracks_for_id(track_id):
    """Get a list of tracks for an ID."""
-    candidates = [track_for_mbid(track_id)]
-    candidates.extend(plugins.track_for_id(track_id))
-    return filter(None, candidates)
+    t = track_for_mbid(track_id)
+    if t:
+        yield t
+    for t in plugins.track_for_id(track_id):
+        if t:
+            yield t


+@plugins.notify_info_yielded(u'albuminfo_received')
 def album_candidates(items, artist, album, va_likely):
    """Search for album matches. ``items`` is a list of Item objects
    that make up the album. ``artist`` and ``album`` are the respective
@@ -537,43 +579,42 @@ def album_candidates(items, artist, album, va_likely):
    entered by the user. ``va_likely`` is a boolean indicating whether
    the album is likely to be a "various artists" release.
    """
-    out = []
-
    # Base candidates if we have album and artist to match.
    if artist and album:
        try:
-            out.extend(mb.match_album(artist, album, len(items)))
+            for candidate in mb.match_album(artist, album, len(items)):
+                yield candidate
        except mb.MusicBrainzAPIError as exc:
            exc.log(log)

    # Also add VA matches from MusicBrainz where appropriate.
    if va_likely and album:
        try:
-            out.extend(mb.match_album(None, album, len(items)))
+            for candidate in mb.match_album(None, album, len(items)):
+                yield candidate
        except mb.MusicBrainzAPIError as exc:
            exc.log(log)

    # Candidates from plugins.
-    out.extend(plugins.candidates(items, artist, album, va_likely))
-
-    return out
+    for candidate in plugins.candidates(items, artist, album, va_likely):
+        yield candidate


+@plugins.notify_info_yielded(u'trackinfo_received')
 def item_candidates(item, artist, title):
    """Search for item matches. ``item`` is the Item to be matched.
    ``artist`` and ``title`` are strings and either reflect the item or
    are specified by the user.
    """
-    out = []

    # MusicBrainz candidates.
    if artist and title:
        try:
-            out.extend(mb.match_track(artist, title))
+            for candidate in mb.match_track(artist, title):
+                yield candidate
        except mb.MusicBrainzAPIError as exc:
            exc.log(log)

    # Plugin candidates.
-    out.extend(plugins.item_candidates(item, artist, title))
-
-    return out
+    for candidate in plugins.item_candidates(item, artist, title):
+        yield candidate
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2013, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -15,13 +16,15 @@
 """Matches existing metadata with canonical information to identify
 releases and tracks.
 """
-from __future__ import division
+
+from __future__ import division, absolute_import, print_function

 import datetime
-import logging
 import re
 from munkres import Munkres
+from collections import namedtuple

+from beets import logging
 from beets import plugins
 from beets import config
 from beets.util import plurality
@@ -50,6 +53,13 @@ class Recommendation(OrderedEnum):
    strong = 3


+# A structure for holding a set of possible matches to choose between. This
+# consists of a list of possible candidates (i.e., AlbumInfo or TrackInfo
+# objects) and a recommendation value.
+
+Proposal = namedtuple('Proposal', ('candidates', 'recommendation'))
+
+
 # Primary matching functionality.

 def current_metadata(items):
@@ -93,7 +103,9 @@ def assign_items(items, tracks):
        costs.append(row)

    # Find a minimum-cost bipartite matching.
+    log.debug('Computing track assignment...')
    matching = Munkres().compute(costs)
+    log.debug('...done.')

    # Produce the output matching.
    mapping = dict((items[i], tracks[j]) for (i, j) in matching)
@@ -235,7 +247,7 @@ def distance(items, album_info, mapping):

    # Tracks.
    dist.tracks = {}
-    for item, track in mapping.iteritems():
+    for item, track in mapping.items():
        dist.tracks[track] = track_distance(item, track, album_info.va)
        dist.add('tracks', dist.tracks[track].distance)

@@ -258,19 +270,23 @@ def match_by_id(items):
    AlbumInfo object for the corresponding album. Otherwise, returns
    None.
    """
-    # Is there a consensus on the MB album ID?
-    albumids = [item.mb_albumid for item in items if item.mb_albumid]
-    if not albumids:
-        log.debug(u'No album IDs found.')
+    albumids = (item.mb_albumid for item in items if item.mb_albumid)
+
+    # Did any of the items have an MB album ID?
+    try:
+        first = next(albumids)
+    except StopIteration:
+        log.debug(u'No album ID found.')
        return None

+    # Is there a consensus on the MB album ID?
+    for other in albumids:
+        if other != first:
+            log.debug(u'No album ID consensus.')
+            return None
    # If all album IDs are equal, look up the album.
-    if bool(reduce(lambda x, y: x if x == y else (), albumids)):
-        albumid = albumids[0]
-        log.debug(u'Searching for discovered album ID: {0}'.format(albumid))
-        return hooks.album_for_mbid(albumid)
-    else:
-        log.debug(u'No album ID consensus.')
+    log.debug(u'Searching for discovered album ID: {0}', first)
+    return hooks.album_for_mbid(first)


 def _recommendation(results):
@@ -309,10 +325,10 @@ def _recommendation(results):
    keys = set(min_dist.keys())
    if isinstance(results[0], hooks.AlbumMatch):
        for track_dist in min_dist.tracks.values():
-            keys.update(track_dist.keys())
+            keys.update(list(track_dist.keys()))
    max_rec_view = config['match']['max_rec']
    for key in keys:
-        if key in max_rec_view.keys():
+        if key in list(max_rec_view.keys()):
            max_rec = max_rec_view[key].as_choice({
                'strong': Recommendation.strong,
                'medium': Recommendation.medium,
@@ -324,17 +340,23 @@ def _recommendation(results):
    return rec


+def _sort_candidates(candidates):
+    """Sort candidates by distance."""
+    return sorted(candidates, key=lambda match: match.distance)
+
+
 def _add_candidate(items, results, info):
    """Given a candidate AlbumInfo object, attempt to add the candidate
    to the output dictionary of AlbumMatch objects. This involves
    checking the track count, ordering the items, checking for
    duplicates, and calculating the distance.
    """
-    log.debug(u'Candidate: {0} - {1}'.format(info.artist, info.album))
+    log.debug(u'Candidate: {0} - {1} ({2})',
+              info.artist, info.album, info.album_id)

    # Discard albums with zero tracks.
    if not info.tracks:
-        log.debug('No tracks.')
+        log.debug(u'No tracks.')
        return

    # Don't duplicate.
@@ -345,7 +367,7 @@ def _add_candidate(items, results, info):
    # Discard matches without required tags.
    for req_tag in config['match']['required'].as_str_seq():
        if getattr(info, req_tag) is None:
-            log.debug(u'Ignored. Missing required tag: {0}'.format(req_tag))
+            log.debug(u'Ignored. Missing required tag: {0}', req_tag)
            return

    # Find mapping between the items and the track info.
@@ -355,48 +377,52 @@ def _add_candidate(items, results, info):
    dist = distance(items, info, mapping)

    # Skip matches with ignored penalties.
-    penalties = [key for _, key in dist]
+    penalties = [key for key, _ in dist]
    for penalty in config['match']['ignored'].as_str_seq():
        if penalty in penalties:
-            log.debug(u'Ignored. Penalty: {0}'.format(penalty))
+            log.debug(u'Ignored. Penalty: {0}', penalty)
            return

-    log.debug(u'Success. Distance: {0}'.format(dist))
+    log.debug(u'Success. Distance: {0}', dist)
    results[info.album_id] = hooks.AlbumMatch(dist, info, mapping,
                                              extra_items, extra_tracks)


 def tag_album(items, search_artist=None, search_album=None,
-              search_id=None):
-    """Return a tuple of a artist name, an album name, a list of
-    `AlbumMatch` candidates from the metadata backend, and a
-    `Recommendation`.
+              search_ids=[]):
+    """Return a tuple of the current artist name, the current album
+    name, and a `Proposal` containing `AlbumMatch` candidates.

    The artist and album are the most common values of these fields
    among `items`.

    The `AlbumMatch` objects are generated by searching the metadata
    backends. By default, the metadata of the items is used for the
-    search. This can be customized by setting the parameters. The
-    `mapping` field of the album has the matched `items` as keys.
+    search. This can be customized by setting the parameters.
+    `search_ids` is a list of metadata backend IDs: if specified,
+    it will restrict the candidates to those IDs, ignoring
+    `search_artist` and `search album`. The `mapping` field of the
+    album has the matched `items` as keys.

-    The recommendation is calculated from the match qualitiy of the
+    The recommendation is calculated from the match quality of the
    candidates.
    """
    # Get current metadata.
    likelies, consensus = current_metadata(items)
    cur_artist = likelies['artist']
    cur_album = likelies['album']
-    log.debug(u'Tagging {0} - {1}'.format(cur_artist, cur_album))
+    log.debug(u'Tagging {0} - {1}', cur_artist, cur_album)

    # The output result (distance, AlbumInfo) tuples (keyed by MB album
    # ID).
    candidates = {}

    # Search by explicit ID.
-    if search_id is not None:
-        log.debug(u'Searching for album ID: {0}'.format(search_id))
-        search_cands = hooks.albums_for_id(search_id)
+    if search_ids:
+        for search_id in search_ids:
+            log.debug(u'Searching for album ID: {0}', search_id)
+            for id_candidate in hooks.albums_for_id(search_id):
+                _add_candidate(items, candidates, id_candidate)

    # Use existing metadata or text search.
    else:
@@ -404,81 +430,84 @@ def tag_album(items, search_artist=None, search_album=None,
        id_info = match_by_id(items)
        if id_info:
            _add_candidate(items, candidates, id_info)
-            rec = _recommendation(candidates.values())
-            log.debug(u'Album ID match recommendation is {0}'.format(str(rec)))
+            rec = _recommendation(list(candidates.values()))
+            log.debug(u'Album ID match recommendation is {0}', rec)
            if candidates and not config['import']['timid']:
                # If we have a very good MBID match, return immediately.
                # Otherwise, this match will compete against metadata-based
                # matches.
                if rec == Recommendation.strong:
                    log.debug(u'ID match.')
-                    return cur_artist, cur_album, candidates.values(), rec
+                    return cur_artist, cur_album, \
+                        Proposal(list(candidates.values()), rec)

        # Search terms.
        if not (search_artist and search_album):
            # No explicit search terms -- use current metadata.
            search_artist, search_album = cur_artist, cur_album
-        log.debug(u'Search terms: {0} - {1}'.format(search_artist,
-                                                    search_album))
+        log.debug(u'Search terms: {0} - {1}', search_artist, search_album)

        # Is this album likely to be a "various artist" release?
        va_likely = ((not consensus['artist']) or
                     (search_artist.lower() in VA_ARTISTS) or
                     any(item.comp for item in items))
-        log.debug(u'Album might be VA: {0}'.format(str(va_likely)))
+        log.debug(u'Album might be VA: {0}', va_likely)

        # Get the results from the data sources.
-        search_cands = hooks.album_candidates(items, search_artist,
-                                              search_album, va_likely)
-
-    log.debug(u'Evaluating {0} candidates.'.format(len(search_cands)))
-    for info in search_cands:
-        _add_candidate(items, candidates, info)
+        for matched_candidate in hooks.album_candidates(items,
+                                                        search_artist,
+                                                        search_album,
+                                                        va_likely):
+            _add_candidate(items, candidates, matched_candidate)

+    log.debug(u'Evaluating {0} candidates.', len(candidates))
    # Sort and get the recommendation.
-    candidates = sorted(candidates.itervalues())
+    candidates = _sort_candidates(candidates.values())
    rec = _recommendation(candidates)
-    return cur_artist, cur_album, candidates, rec
+    return cur_artist, cur_album, Proposal(candidates, rec)


 def tag_item(item, search_artist=None, search_title=None,
-             search_id=None):
-    """Attempts to find metadata for a single track. Returns a
-    `(candidates, recommendation)` pair where `candidates` is a list of
-    TrackMatch objects. `search_artist` and `search_title` may be used
+             search_ids=[]):
+    """Find metadata for a single track. Return a `Proposal` consisting
+    of `TrackMatch` objects.
+
+    `search_artist` and `search_title` may be used
    to override the current metadata for the purposes of the MusicBrainz
-    title; likewise `search_id`.
+    title. `search_ids` may be used for restricting the search to a list
+    of metadata backend IDs.
    """
    # Holds candidates found so far: keys are MBIDs; values are
    # (distance, TrackInfo) pairs.
    candidates = {}

    # First, try matching by MusicBrainz ID.
-    trackid = search_id or item.mb_trackid
-    if trackid:
-        log.debug(u'Searching for track ID: {0}'.format(trackid))
-        for track_info in hooks.tracks_for_id(trackid):
-            dist = track_distance(item, track_info, incl_artist=True)
-            candidates[track_info.track_id] = \
-                hooks.TrackMatch(dist, track_info)
-            # If this is a good match, then don't keep searching.
-            rec = _recommendation(candidates.values())
-            if rec == Recommendation.strong and not config['import']['timid']:
-                log.debug(u'Track ID match.')
-                return candidates.values(), rec
+    trackids = search_ids or [t for t in [item.mb_trackid] if t]
+    if trackids:
+        for trackid in trackids:
+            log.debug(u'Searching for track ID: {0}', trackid)
+            for track_info in hooks.tracks_for_id(trackid):
+                dist = track_distance(item, track_info, incl_artist=True)
+                candidates[track_info.track_id] = \
+                    hooks.TrackMatch(dist, track_info)
+                # If this is a good match, then don't keep searching.
+                rec = _recommendation(_sort_candidates(candidates.values()))
+                if rec == Recommendation.strong and \
+                        not config['import']['timid']:
+                    log.debug(u'Track ID match.')
+                    return Proposal(_sort_candidates(candidates.values()), rec)

    # If we're searching by ID, don't proceed.
-    if search_id is not None:
+    if search_ids:
        if candidates:
-            return candidates.values(), rec
+            return Proposal(_sort_candidates(candidates.values()), rec)
        else:
-            return [], Recommendation.none
+            return Proposal([], Recommendation.none)

    # Search terms.
    if not (search_artist and search_title):
        search_artist, search_title = item.artist, item.title
-    log.debug(u'Item search terms: {0} - {1}'.format(search_artist,
-                                                     search_title))
+    log.debug(u'Item search terms: {0} - {1}', search_artist, search_title)

    # Get and evaluate candidate metadata.
    for track_info in hooks.item_candidates(item, search_artist, search_title):
@@ -486,7 +515,7 @@ def tag_item(item, search_artist=None, search_title=None,
        candidates[track_info.track_id] = hooks.TrackMatch(dist, track_info)

    # Sort by distance and return with recommendation.
-    log.debug(u'Found {0} candidates.'.format(len(candidates)))
-    candidates = sorted(candidates.itervalues())
+    log.debug(u'Found {0} candidates.', len(candidates))
+    candidates = _sort_candidates(candidates.values())
    rec = _recommendation(candidates)
-    return candidates, rec
+    return Proposal(candidates, rec)
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2013, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -14,23 +15,29 @@

 """Searches for albums in the MusicBrainz database.
 """
-import logging
+from __future__ import division, absolute_import, print_function
+
 import musicbrainzngs
 import re
 import traceback
-from urlparse import urljoin
+from six.moves.urllib.parse import urljoin

+from beets import logging
 import beets.autotag.hooks
 import beets
 from beets import util
 from beets import config
+import six

-SEARCH_LIMIT = 5
 VARIOUS_ARTISTS_ID = '89ad4ac3-39f7-470e-963a-56509c546377'
-BASE_URL = 'http://musicbrainz.org/'
+
+if util.SNI_SUPPORTED:
+    BASE_URL = 'https://musicbrainz.org/'
+else:
+    BASE_URL = 'http://musicbrainz.org/'

 musicbrainzngs.set_useragent('beets', beets.__version__,
-                             'http://beets.radbox.org/')
+                             'http://beets.io/')


 class MusicBrainzAPIError(util.HumanReadableException):
@@ -39,6 +46,8 @@ class MusicBrainzAPIError(util.HumanReadableException):
    """
    def __init__(self, reason, verb, query, tb=None):
        self.query = query
+        if isinstance(reason, musicbrainzngs.WebServiceError):
+            reason = u'MusicBrainz not reachable'
        super(MusicBrainzAPIError, self).__init__(reason, verb, tb)

    def get_message(self):
@@ -49,8 +58,12 @@ class MusicBrainzAPIError(util.HumanReadableException):
 log = logging.getLogger('beets')

 RELEASE_INCLUDES = ['artists', 'media', 'recordings', 'release-groups',
-                    'labels', 'artist-credits', 'aliases']
+                    'labels', 'artist-credits', 'aliases',
+                    'recording-level-rels', 'work-rels',
+                    'work-level-rels', 'artist-rels']
 TRACK_INCLUDES = ['artists', 'aliases']
+if 'work-level-rels' in musicbrainzngs.VALID_INCLUDES['recording']:
+    TRACK_INCLUDES += ['work-level-rels', 'artist-rels']


 def track_url(trackid):
@@ -65,7 +78,8 @@ def configure():
    """Set up the python-musicbrainz-ngs module according to settings
    from the beets configuration. This should be called at startup.
    """
-    musicbrainzngs.set_hostname(config['musicbrainz']['host'].get(unicode))
+    hostname = config['musicbrainz']['host'].as_str()
+    musicbrainzngs.set_hostname(hostname)
    musicbrainzngs.set_rate_limit(
        config['musicbrainz']['ratelimit_interval'].as_number(),
        config['musicbrainz']['ratelimit'].get(int),
@@ -104,7 +118,7 @@ def _flatten_artist_credit(credit):
    artist_sort_parts = []
    artist_credit_parts = []
    for el in credit:
-        if isinstance(el, basestring):
+        if isinstance(el, six.string_types):
            # Join phrase.
            artist_parts.append(el)
            artist_credit_parts.append(el)
@@ -157,6 +171,7 @@ def track_info(recording, index=None, medium=None, medium_index=None,
        medium=medium,
        medium_index=medium_index,
        medium_total=medium_total,
+        data_source=u'MusicBrainz',
        data_url=track_url(recording['id']),
    )

@@ -172,6 +187,33 @@ def track_info(recording, index=None, medium=None, medium_index=None,
    if recording.get('length'):
        info.length = int(recording['length']) / (1000.0)

+    lyricist = []
+    composer = []
+    for work_relation in recording.get('work-relation-list', ()):
+        if work_relation['type'] != 'performance':
+            continue
+        for artist_relation in work_relation['work'].get(
+                'artist-relation-list', ()):
+            if 'type' in artist_relation:
+                type = artist_relation['type']
+                if type == 'lyricist':
+                    lyricist.append(artist_relation['artist']['name'])
+                elif type == 'composer':
+                    composer.append(artist_relation['artist']['name'])
+    if lyricist:
+        info.lyricist = u', '.join(lyricist)
+    if composer:
+        info.composer = u', '.join(composer)
+
+    arranger = []
+    for artist_relation in recording.get('artist-relation-list', ()):
+        if 'type' in artist_relation:
+            type = artist_relation['type']
+            if type == 'arranger':
+                arranger.append(artist_relation['artist']['name'])
+    if arranger:
+        info.arranger = u', '.join(arranger)
+
    info.decode()
    return info

@@ -210,7 +252,12 @@ def album_info(release):
    for medium in release['medium-list']:
        disctitle = medium.get('title')
        format = medium.get('format')
-        for track in medium['track-list']:
+
+        all_tracks = medium['track-list']
+        if 'pregap' in medium:
+            all_tracks.insert(0, medium['pregap'])
+
+        for track in all_tracks:
            # Basic information from the recording.
            index += 1
            ti = track_info(
@@ -222,6 +269,7 @@ def album_info(release):
            )
            ti.disctitle = disctitle
            ti.media = format
+            ti.track_alt = track['number']

            # Prefer track data, where present, over recording data.
            if track.get('title'):
@@ -245,10 +293,12 @@ def album_info(release):
        mediums=len(release['medium-list']),
        artist_sort=artist_sort_name,
        artist_credit=artist_credit_name,
-        data_source='MusicBrainz',
+        data_source=u'MusicBrainz',
        data_url=album_url(release['id']),
    )
    info.va = info.artist_id == VARIOUS_ARTISTS_ID
+    if info.va:
+        info.artist = config['va_name'].as_str()
    info.asin = release.get('asin')
    info.releasegroup_id = release['release-group']['id']
    info.country = release.get('country')
@@ -301,7 +351,7 @@ def album_info(release):
    return info


-def match_album(artist, album, tracks=None, limit=SEARCH_LIMIT):
+def match_album(artist, album, tracks=None):
    """Searches for a single album ("release" in MusicBrainz parlance)
    and returns an iterator over AlbumInfo objects. May raise a
    MusicBrainzAPIError.
@@ -317,14 +367,16 @@ def match_album(artist, album, tracks=None, limit=SEARCH_LIMIT):
        # Various Artists search.
        criteria['arid'] = VARIOUS_ARTISTS_ID
    if tracks is not None:
-        criteria['tracks'] = str(tracks)
+        criteria['tracks'] = six.text_type(tracks)

    # Abort if we have no search terms.
-    if not any(criteria.itervalues()):
+    if not any(criteria.values()):
        return

    try:
-        res = musicbrainzngs.search_releases(limit=limit, **criteria)
+        log.debug(u'Searching for MusicBrainz releases with: {!r}', criteria)
+        res = musicbrainzngs.search_releases(
+            limit=config['musicbrainz']['searchlimit'].get(int), **criteria)
    except musicbrainzngs.MusicBrainzError as exc:
        raise MusicBrainzAPIError(exc, 'release search', criteria,
                                  traceback.format_exc())
@@ -336,7 +388,7 @@ def match_album(artist, album, tracks=None, limit=SEARCH_LIMIT):
            yield albuminfo


-def match_track(artist, title, limit=SEARCH_LIMIT):
+def match_track(artist, title):
    """Searches for a single track and returns an iterable of TrackInfo
    objects. May raise a MusicBrainzAPIError.
    """
@@ -345,11 +397,12 @@ def match_track(artist, title, limit=SEARCH_LIMIT):
        'recording': title.lower().strip(),
    }

-    if not any(criteria.itervalues()):
+    if not any(criteria.values()):
        return

    try:
-        res = musicbrainzngs.search_recordings(limit=limit, **criteria)
+        res = musicbrainzngs.search_recordings(
+            limit=config['musicbrainz']['searchlimit'].get(int), **criteria)
    except musicbrainzngs.MusicBrainzError as exc:
        raise MusicBrainzAPIError(exc, 'recording search', criteria,
                                  traceback.format_exc())
@@ -362,7 +415,7 @@ def _parse_id(s):
    no ID can be found, return None.
    """
    # Find the first thing that looks like a UUID/MBID.
-    match = re.search('[a-f0-9]{8}(-[a-f0-9]{4}){3}-[a-f0-9]{12}', s)
+    match = re.search(u'[a-f0-9]{8}(-[a-f0-9]{4}){3}-[a-f0-9]{12}', s)
    if match:
        return match.group()

@@ -372,9 +425,10 @@ def album_for_id(releaseid):
    object or None if the album is not found. May raise a
    MusicBrainzAPIError.
    """
+    log.debug(u'Requesting MusicBrainz release {}', releaseid)
    albumid = _parse_id(releaseid)
    if not albumid:
-        log.debug(u'Invalid MBID ({0}).'.format(releaseid))
+        log.debug(u'Invalid MBID ({0}).', releaseid)
        return
    try:
        res = musicbrainzngs.get_release_by_id(albumid,
@@ -383,7 +437,7 @@ def album_for_id(releaseid):
        log.debug(u'Album ID match failed.')
        return None
    except musicbrainzngs.MusicBrainzError as exc:
-        raise MusicBrainzAPIError(exc, 'get release by ID', albumid,
+        raise MusicBrainzAPIError(exc, u'get release by ID', albumid,
                                  traceback.format_exc())
    return album_info(res['release'])

@@ -394,7 +448,7 @@ def track_for_id(releaseid):
    """
    trackid = _parse_id(releaseid)
    if not trackid:
-        log.debug(u'Invalid MBID ({0}).'.format(releaseid))
+        log.debug(u'Invalid MBID ({0}).', releaseid)
        return
    try:
        res = musicbrainzngs.get_recording_by_id(trackid, TRACK_INCLUDES)
@@ -402,6 +456,6 @@ def track_for_id(releaseid):
        log.debug(u'Track ID match failed.')
        return None
    except musicbrainzngs.MusicBrainzError as exc:
-        raise MusicBrainzAPIError(exc, 'get recording by ID', trackid,
+        raise MusicBrainzAPIError(exc, u'get recording by ID', trackid,
                                  traceback.format_exc())
    return track_info(res['recording'])
@@ -6,6 +6,7 @@ import:
    copy: yes
    move: no
    link: no
+    hardlink: no
    delete: no
    resume: ask
    incremental: no
@@ -22,9 +23,13 @@ import:
    flat: no
    group_albums: no
    pretend: false
+    search_ids: []
+    duplicate_action: ask

 clutter: ["Thumbs.DB", ".DS_Store"]
-ignore: [".*", "*~", "System Volume Information"]
+ignore: [".*", "*~", "System Volume Information", "lost+found"]
+ignore_hidden: yes
+
 replace:
    '[\\/]': _
    '^\.': _
@@ -41,24 +46,35 @@ max_filename_length: 0
 plugins: []
 pluginpath: []
 threaded: yes
-color: yes
 timeout: 5.0
 per_disc_numbering: no
-verbose: no
-terminal_encoding: utf8
+verbose: 0
+terminal_encoding:
 original_date: no
 id3v23: no
+va_name: "Various Artists"

 ui:
    terminal_width: 80
    length_diff_thresh: 10.0
+    color: yes
+    colors:
+        text_success: green
+        text_warning: yellow
+        text_error: red
+        text_highlight: red
+        text_highlight_minor: lightgray
+        action_default: turquoise
+        action: blue

-list_format_item: $artist - $album - $title
-list_format_album: $albumartist - $album
+format_item: $artist - $album - $title
+format_album: $albumartist - $album
 time_format: '%Y-%m-%d %H:%M:%S'
+format_raw_length: no

 sort_album: albumartist+ album+
 sort_item: artist+ album+ disc+ track+
+sort_case_insensitive: yes

 paths:
    default: $albumartist/$album%aunique{}/$track $title
@@ -71,6 +87,7 @@ musicbrainz:
    host: musicbrainz.org
    ratelimit: 1
    ratelimit_interval: 1.0
+    searchlimit: 5

 match:
    strong_rec_thresh: 0.04
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2014, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -15,11 +16,14 @@
 """DBCore is an abstract database package that forms the basis for beets'
 Library.
 """
+from __future__ import division, absolute_import, print_function
+
 from .db import Model, Database
 from .query import Query, FieldQuery, MatchQuery, AndQuery, OrQuery
 from .types import Type
 from .queryparse import query_from_strings
 from .queryparse import sort_from_strings
 from .queryparse import parse_sorted_query
+from .query import InvalidQueryError

 # flake8: noqa
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2014, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -14,6 +15,8 @@

 """The central Model and Database constructs for DBCore.
 """
+from __future__ import division, absolute_import, print_function
+
 import time
 import os
 from collections import defaultdict
@@ -24,14 +27,16 @@ import collections

 import beets
 from beets.util.functemplate import Template
+from beets.util import py3_path
 from beets.dbcore import types
 from .query import MatchQuery, NullSort, TrueQuery
+import six


 class FormattedMapping(collections.Mapping):
    """A `dict`-like formatted view of a model.

-    The accessor `mapping[key]` returns the formated version of
+    The accessor `mapping[key]` returns the formatted version of
    `model[key]` as a unicode string.

    If `for_path` is true, all path separators in the formatted values
@@ -63,10 +68,10 @@ class FormattedMapping(collections.Mapping):
    def _get_formatted(self, model, key):
        value = model._type(key).format(model.get(key))
        if isinstance(value, bytes):
-            value = value.decode('utf8', 'ignore')
+            value = value.decode('utf-8', 'ignore')

        if self.for_path:
-            sep_repl = beets.config['path_sep_replace'].get(unicode)
+            sep_repl = beets.config['path_sep_replace'].as_str()
            for sep in (os.path.sep, os.path.altsep):
                if sep:
                    value = value.replace(sep, sep_repl)
@@ -173,9 +178,9 @@ class Model(object):
        ordinary construction are bypassed.
        """
        obj = cls(db)
-        for key, value in fixed_values.iteritems():
+        for key, value in fixed_values.items():
            obj._values_fixed[key] = cls._type(key).from_sql(value)
-        for key, value in flex_values.iteritems():
+        for key, value in flex_values.items():
            obj._values_flex[key] = cls._type(key).from_sql(value)
        return obj

@@ -197,20 +202,22 @@ class Model(object):
        exception is raised otherwise.
        """
        if not self._db:
-            raise ValueError('{0} has no database'.format(type(self).__name__))
+            raise ValueError(
+                u'{0} has no database'.format(type(self).__name__)
+            )
        if need_id and not self.id:
-            raise ValueError('{0} has no id'.format(type(self).__name__))
+            raise ValueError(u'{0} has no id'.format(type(self).__name__))

    # Essential field accessors.

    @classmethod
-    def _type(self, key):
+    def _type(cls, key):
        """Get the type of a field, a `Type` instance.

        If the field has no explicit type, it is given the base `Type`,
        which does no conversion.
        """
-        return self._fields.get(key) or self._types.get(key) or types.DEFAULT
+        return cls._fields.get(key) or cls._types.get(key) or types.DEFAULT

    def __getitem__(self, key):
        """Get the value for a field. Raise a KeyError if the field is
@@ -251,23 +258,30 @@ class Model(object):
            del self._values_flex[key]
            self._dirty.add(key)  # Mark for dropping on store.
        elif key in self._getters():  # Computed.
-            raise KeyError('computed field {0} cannot be deleted'.format(key))
+            raise KeyError(u'computed field {0} cannot be deleted'.format(key))
        elif key in self._fields:  # Fixed.
-            raise KeyError('fixed field {0} cannot be deleted'.format(key))
+            raise KeyError(u'fixed field {0} cannot be deleted'.format(key))
        else:
-            raise KeyError('no such field {0}'.format(key))
+            raise KeyError(u'no such field {0}'.format(key))

    def keys(self, computed=False):
        """Get a list of available field names for this object. The
        `computed` parameter controls whether computed (plugin-provided)
        fields are included in the key list.
        """
-        base_keys = list(self._fields) + self._values_flex.keys()
+        base_keys = list(self._fields) + list(self._values_flex.keys())
        if computed:
-            return base_keys + self._getters().keys()
+            return base_keys + list(self._getters().keys())
        else:
            return base_keys

+    @classmethod
+    def all_keys(cls):
+        """Get a list of available keys for objects of this type.
+        Includes fixed and computed fields.
+        """
+        return list(cls._fields) + list(cls._getters().keys())
+
    # Act like a dictionary.

    def update(self, values):
@@ -307,12 +321,12 @@ class Model(object):

    def __getattr__(self, key):
        if key.startswith('_'):
-            raise AttributeError('model has no attribute {0!r}'.format(key))
+            raise AttributeError(u'model has no attribute {0!r}'.format(key))
        else:
            try:
                return self[key]
            except KeyError:
-                raise AttributeError('no such field {0!r}'.format(key))
+                raise AttributeError(u'no such field {0!r}'.format(key))

    def __setattr__(self, key, value):
        if key.startswith('_'):
@@ -328,15 +342,19 @@ class Model(object):

    # Database interaction (CRUD methods).

-    def store(self):
+    def store(self, fields=None):
        """Save the object's metadata into the library database.
+        :param fields: the fields to be stored. If not specified, all fields
+        will be.
        """
+        if fields is None:
+            fields = self._fields
        self._check_db()

        # Build assignments for query.
        assignments = []
        subvars = []
-        for key in self._fields:
+        for key in fields:
            if key != 'id' and key in self._dirty:
                self._dirty.remove(key)
                assignments.append(key + '=?')
@@ -379,7 +397,7 @@ class Model(object):
        """
        self._check_db()
        stored_obj = self._db._get(type(self), self.id)
-        assert stored_obj is not None, "object {0} not in DB".format(self.id)
+        assert stored_obj is not None, u"object {0} not in DB".format(self.id)
        self._values_fixed = {}
        self._values_flex = {}
        self.update(dict(stored_obj))
@@ -440,7 +458,7 @@ class Model(object):
        separators will be added to the template.
        """
        # Perform substitution.
-        if isinstance(template, basestring):
+        if isinstance(template, six.string_types):
            template = Template(template)
        return template.substitute(self.formatted(for_path),
                                   self._template_funcs())
@@ -451,11 +469,16 @@ class Model(object):
    def _parse(cls, key, string):
        """Parse a string as a value for the given key.
        """
-        if not isinstance(string, basestring):
-            raise TypeError("_parse() argument must be a string")
+        if not isinstance(string, six.string_types):
+            raise TypeError(u"_parse() argument must be a string")

        return cls._type(key).parse(string)

+    def set_parse(self, key, string):
+        """Set the object's key to a value represented by a string.
+        """
+        self[key] = self._parse(key, string)
+

 # Database controller and supporting interfaces.

@@ -576,6 +599,11 @@ class Results(object):
            return self._row_count

    def __nonzero__(self):
+        """Does this result contain any objects?
+        """
+        return self.__bool__()
+
+    def __bool__(self):
        """Does this result contain any objects?
        """
        return bool(len(self))
@@ -592,10 +620,10 @@ class Results(object):
        it = iter(self)
        try:
            for i in range(n):
-                it.next()
-            return it.next()
+                next(it)
+            return next(it)
        except StopIteration:
-            raise IndexError('result index {0} out of range'.format(n))
+            raise IndexError(u'result index {0} out of range'.format(n))

    def get(self):
        """Return the first matching object, or None if no objects
@@ -603,7 +631,7 @@ class Results(object):
        """
        it = iter(self)
        try:
-            return it.next()
+            return next(it)
        except StopIteration:
            return None

@@ -668,8 +696,9 @@ class Database(object):
    """The Model subclasses representing tables in this database.
    """

-    def __init__(self, path):
+    def __init__(self, path, timeout=5.0):
        self.path = path
+        self.timeout = timeout

        self._connections = {}
        self._tx_stacks = defaultdict(list)
@@ -704,18 +733,36 @@ class Database(object):
            if thread_id in self._connections:
                return self._connections[thread_id]
            else:
-                # Make a new connection.
-                conn = sqlite3.connect(
-                    self.path,
-                    timeout=beets.config['timeout'].as_number(),
-                )
-
-                # Access SELECT results like dictionaries.
-                conn.row_factory = sqlite3.Row
-
+                conn = self._create_connection()
                self._connections[thread_id] = conn
                return conn

+    def _create_connection(self):
+        """Create a SQLite connection to the underlying database.
+
+        Makes a new connection every time. If you need to configure the
+        connection settings (e.g., add custom functions), override this
+        method.
+        """
+        # Make a new connection. The `sqlite3` module can't use
+        # bytestring paths here on Python 3, so we need to
+        # provide a `str` using `py3_path`.
+        conn = sqlite3.connect(
+            py3_path(self.path), timeout=self.timeout
+        )
+
+        # Access SELECT results like dictionaries.
+        conn.row_factory = sqlite3.Row
+        return conn
+
+    def _close(self):
+        """Close the all connections to the underlying SQLite database
+        from all threads. This does not render the database object
+        unusable; new connections can still be opened on demand.
+        """
+        with self._shared_map_lock:
+            self._connections.clear()
+
    @contextlib.contextmanager
    def _tx_stack(self):
        """A context manager providing access to the current thread's
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2014, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -14,10 +15,49 @@

 """The Query type hierarchy for DBCore.
 """
+from __future__ import division, absolute_import, print_function
+
 import re
-from operator import attrgetter
+from operator import mul
 from beets import util
 from datetime import datetime, timedelta
+import unicodedata
+from functools import reduce
+import six
+
+if not six.PY2:
+    buffer = memoryview  # sqlite won't accept memoryview in python 2
+
+
+class ParsingError(ValueError):
+    """Abstract class for any unparseable user-requested album/query
+    specification.
+    """
+
+
+class InvalidQueryError(ParsingError):
+    """Represent any kind of invalid query.
+
+    The query should be a unicode string or a list, which will be space-joined.
+    """
+    def __init__(self, query, explanation):
+        if isinstance(query, list):
+            query = " ".join(query)
+        message = u"'{0}': {1}".format(query, explanation)
+        super(InvalidQueryError, self).__init__(message)
+
+
+class InvalidQueryArgumentTypeError(ParsingError):
+    """Represent a query argument that could not be converted as expected.
+
+    It exists to be caught in upper stack levels so a meaningful (i.e. with the
+    query) InvalidQueryError can be raised.
+    """
+    def __init__(self, what, expected, detail=None):
+        message = u"'{0}' is not {1}".format(what, expected)
+        if detail:
+            message = u"{0}: {1}".format(message, detail)
+        super(InvalidQueryArgumentTypeError, self).__init__(message)


 class Query(object):
@@ -25,9 +65,8 @@ class Query(object):
    """
    def clause(self):
        """Generate an SQLite expression implementing the query.
-        Return a clause string, a sequence of substitution values for
-        the clause, and a Query object representing the "remainder"
-        Returns (clause, subvals) where clause is a valid sqlite
+
+        Return (clause, subvals) where clause is a valid sqlite
        WHERE clause implementing the query and subvals is a list of
        items to be substituted for ?s in the clause.
        """
@@ -39,6 +78,15 @@ class Query(object):
        """
        raise NotImplementedError

+    def __repr__(self):
+        return "{0.__class__.__name__}()".format(self)
+
+    def __eq__(self, other):
+        return type(self) == type(other)
+
+    def __hash__(self):
+        return 0
+

 class FieldQuery(Query):
    """An abstract query that searches in a specific field for a
@@ -72,6 +120,17 @@ class FieldQuery(Query):
    def match(self, item):
        return self.value_match(self.pattern, item.get(self.field))

+    def __repr__(self):
+        return ("{0.__class__.__name__}({0.field!r}, {0.pattern!r}, "
+                "{0.fast})".format(self))
+
+    def __eq__(self, other):
+        return super(FieldQuery, self).__eq__(other) and \
+            self.field == other.field and self.pattern == other.pattern
+
+    def __hash__(self):
+        return hash((self.field, hash(self.pattern)))
+

 class MatchQuery(FieldQuery):
    """A query that looks for exact matches in an item field."""
@@ -86,19 +145,21 @@ class MatchQuery(FieldQuery):
 class NoneQuery(FieldQuery):

    def __init__(self, field, fast=True):
-        self.field = field
-        self.fast = fast
+        super(NoneQuery, self).__init__(field, None, fast)

    def col_clause(self):
        return self.field + " IS NULL", ()

    @classmethod
-    def match(self, item):
+    def match(cls, item):
        try:
-            return item[self.field] is None
+            return item[cls.field] is None
        except KeyError:
            return True

+    def __repr__(self):
+        return "{0.__class__.__name__}({0.field!r}, {0.fast})".format(self)
+

 class StringFieldQuery(FieldQuery):
    """A FieldQuery that converts values to strings before matching
@@ -139,15 +200,31 @@ class SubstringQuery(StringFieldQuery):
 class RegexpQuery(StringFieldQuery):
    """A query that matches a regular expression in a specific item
    field.
+
+    Raises InvalidQueryError when the pattern is not a valid regular
+    expression.
    """
+    def __init__(self, field, pattern, fast=True):
+        super(RegexpQuery, self).__init__(field, pattern, fast)
+        pattern = self._normalize(pattern)
+        try:
+            self.pattern = re.compile(self.pattern)
+        except re.error as exc:
+            # Invalid regular expression.
+            raise InvalidQueryArgumentTypeError(pattern,
+                                                u"a regular expression",
+                                                format(exc))
+
+    @staticmethod
+    def _normalize(s):
+        """Normalize a Unicode string's representation (used on both
+        patterns and matched values).
+        """
+        return unicodedata.normalize('NFC', s)
+
    @classmethod
    def string_match(cls, pattern, value):
-        try:
-            res = re.search(pattern, value)
-        except re.error:
-            # Invalid regular expression.
-            return False
-        return res is not None
+        return pattern.search(cls._normalize(value)) is not None


 class BooleanQuery(MatchQuery):
@@ -156,28 +233,26 @@ class BooleanQuery(MatchQuery):
    """
    def __init__(self, field, pattern, fast=True):
        super(BooleanQuery, self).__init__(field, pattern, fast)
-        if isinstance(pattern, basestring):
+        if isinstance(pattern, six.string_types):
            self.pattern = util.str2bool(pattern)
        self.pattern = int(self.pattern)


 class BytesQuery(MatchQuery):
    """Match a raw bytes field (i.e., a path). This is a necessary hack
-    to work around the `sqlite3` module's desire to treat `str` and
+    to work around the `sqlite3` module's desire to treat `bytes` and
    `unicode` equivalently in Python 2. Always use this query instead of
    `MatchQuery` when matching on BLOB values.
    """
    def __init__(self, field, pattern):
        super(BytesQuery, self).__init__(field, pattern)

-        # Use a buffer representation of the pattern for SQLite
+        # Use a buffer/memoryview representation of the pattern for SQLite
        # matching. This instructs SQLite to treat the blob as binary
        # rather than encoded Unicode.
-        if isinstance(self.pattern, basestring):
-            # Implicitly coerce Unicode strings to their bytes
-            # equivalents.
-            if isinstance(self.pattern, unicode):
-                self.pattern = self.pattern.encode('utf8')
+        if isinstance(self.pattern, (six.text_type, bytes)):
+            if isinstance(self.pattern, six.text_type):
+                self.pattern = self.pattern.encode('utf-8')
            self.buf_pattern = buffer(self.pattern)
        elif isinstance(self.pattern, buffer):
            self.buf_pattern = self.pattern
@@ -191,19 +266,26 @@ class NumericQuery(FieldQuery):
    """Matches numeric fields. A syntax using Ruby-style range ellipses
    (``..``) lets users specify one- or two-sided ranges. For example,
    ``year:2001..`` finds music released since the turn of the century.
+
+    Raises InvalidQueryError when the pattern does not represent an int or
+    a float.
    """
    def _convert(self, s):
-        """Convert a string to a numeric type (float or int). If the
-        string cannot be converted, return None.
+        """Convert a string to a numeric type (float or int).
+
+        Return None if `s` is empty.
+        Raise an InvalidQueryError if the string cannot be converted.
        """
        # This is really just a bit of fun premature optimization.
+        if not s:
+            return None
        try:
            return int(s)
        except ValueError:
            try:
                return float(s)
            except ValueError:
-                return None
+                raise InvalidQueryArgumentTypeError(s, u"an int or a float")

    def __init__(self, field, pattern, fast=True):
        super(NumericQuery, self).__init__(field, pattern, fast)
@@ -224,7 +306,7 @@ class NumericQuery(FieldQuery):
        if self.field not in item:
            return False
        value = item[self.field]
-        if isinstance(value, basestring):
+        if isinstance(value, six.string_types):
            value = self._convert(value)

        if self.point is not None:
@@ -248,7 +330,7 @@ class NumericQuery(FieldQuery):
            elif self.rangemax is not None:
                return u'{0} <= ?'.format(self.field), (self.rangemax,)
            else:
-                return '1', ()
+                return u'1', ()


 class CollectionQuery(Query):
@@ -273,7 +355,7 @@ class CollectionQuery(Query):
        return item in self.subqueries

    def clause_with_joiner(self, joiner):
-        """Returns a clause created by joining together the clauses of
+        """Return a clause created by joining together the clauses of
        all subqueries with the string joiner (padded by spaces).
        """
        clause_parts = []
@@ -288,6 +370,19 @@ class CollectionQuery(Query):
        clause = (' ' + joiner + ' ').join(clause_parts)
        return clause, subvals

+    def __repr__(self):
+        return "{0.__class__.__name__}({0.subqueries!r})".format(self)
+
+    def __eq__(self, other):
+        return super(CollectionQuery, self).__eq__(other) and \
+            self.subqueries == other.subqueries
+
+    def __hash__(self):
+        """Since subqueries are mutable, this object should not be hashable.
+        However and for conveniences purposes, it can be hashed.
+        """
+        return reduce(mul, map(hash, self.subqueries), 1)
+

 class AnyFieldQuery(CollectionQuery):
    """A query that matches if a given FieldQuery subclass matches in
@@ -313,6 +408,17 @@ class AnyFieldQuery(CollectionQuery):
                return True
        return False

+    def __repr__(self):
+        return ("{0.__class__.__name__}({0.pattern!r}, {0.fields!r}, "
+                "{0.query_class.__name__})".format(self))
+
+    def __eq__(self, other):
+        return super(AnyFieldQuery, self).__eq__(other) and \
+            self.query_class == other.query_class
+
+    def __hash__(self):
+        return hash((self.pattern, tuple(self.fields), self.query_class))
+

 class MutableCollectionQuery(CollectionQuery):
    """A collection query whose subqueries may be modified after the
@@ -343,6 +449,36 @@ class OrQuery(MutableCollectionQuery):
        return any([q.match(item) for q in self.subqueries])


+class NotQuery(Query):
+    """A query that matches the negation of its `subquery`, as a shorcut for
+    performing `not(subquery)` without using regular expressions.
+    """
+    def __init__(self, subquery):
+        self.subquery = subquery
+
+    def clause(self):
+        clause, subvals = self.subquery.clause()
+        if clause:
+            return 'not ({0})'.format(clause), subvals
+        else:
+            # If there is no clause, there is nothing to negate. All the logic
+            # is handled by match() for slow queries.
+            return clause, subvals
+
+    def match(self, item):
+        return not self.subquery.match(item)
+
+    def __repr__(self):
+        return "{0.__class__.__name__}({0.subquery!r})".format(self)
+
+    def __eq__(self, other):
+        return super(NotQuery, self).__eq__(other) and \
+            self.subquery == other.subquery
+
+    def __hash__(self):
+        return hash(('not', hash(self.subquery)))
+
+
 class TrueQuery(Query):
    """A query that always matches."""
    def clause(self):
@@ -367,13 +503,13 @@ def _to_epoch_time(date):
    """Convert a `datetime` object to an integer number of seconds since
    the (local) Unix epoch.
    """
-    epoch = datetime.fromtimestamp(0)
-    delta = date - epoch
-    try:
+    if hasattr(date, 'timestamp'):
+        # The `timestamp` method exists on Python 3.3+.
+        return int(date.timestamp())
+    else:
+        epoch = datetime.fromtimestamp(0)
+        delta = date - epoch
        return int(delta.total_seconds())
-    except AttributeError:
-        # datetime.timedelta.total_seconds() is not available on Python 2.6
-        return delta.seconds + delta.days * 24 * 3600


 def _parse_periods(pattern):
@@ -405,7 +541,7 @@ class Period(object):
        precision (a string, one of "year", "month", or "day").
        """
        if precision not in Period.precisions:
-            raise ValueError('Invalid precision ' + str(precision))
+            raise ValueError(u'Invalid precision {0}'.format(precision))
        self.date = date
        self.precision = precision

@@ -445,7 +581,7 @@ class Period(object):
        elif 'day' == precision:
            return date + timedelta(days=1)
        else:
-            raise ValueError('unhandled precision ' + str(precision))
+            raise ValueError(u'unhandled precision {0}'.format(precision))


 class DateInterval(object):
@@ -457,7 +593,7 @@ class DateInterval(object):

    def __init__(self, start, end):
        if start is not None and end is not None and not start < end:
-            raise ValueError("start date {0} is not before end date {1}"
+            raise ValueError(u"start date {0} is not before end date {1}"
                             .format(start, end))
        self.start = start
        self.end = end
@@ -478,7 +614,7 @@ class DateInterval(object):
        return True

    def __str__(self):
-        return'[{0}, {1})'.format(self.start, self.end)
+        return '[{0}, {1})'.format(self.start, self.end)


 class DateQuery(FieldQuery):
@@ -496,6 +632,8 @@ class DateQuery(FieldQuery):
        self.interval = DateInterval.from_periods(start, end)

    def match(self, item):
+        if self.field not in item:
+            return False
        timestamp = float(item[self.field])
        date = datetime.utcfromtimestamp(timestamp)
        return self.interval.contains(date)
@@ -523,6 +661,33 @@ class DateQuery(FieldQuery):
        return clause, subvals


+class DurationQuery(NumericQuery):
+    """NumericQuery that allow human-friendly (M:SS) time interval formats.
+
+    Converts the range(s) to a float value, and delegates on NumericQuery.
+
+    Raises InvalidQueryError when the pattern does not represent an int, float
+    or M:SS time interval.
+    """
+    def _convert(self, s):
+        """Convert a M:SS or numeric string to a float.
+
+        Return None if `s` is empty.
+        Raise an InvalidQueryError if the string cannot be converted.
+        """
+        if not s:
+            return None
+        try:
+            return util.raw_seconds_short(s)
+        except ValueError:
+            try:
+                return float(s)
+            except ValueError:
+                raise InvalidQueryArgumentTypeError(
+                    s,
+                    u"a M:SS string or a float")
+
+
 # Sorting.

 class Sort(object):
@@ -547,6 +712,12 @@ class Sort(object):
        """
        return False

+    def __hash__(self):
+        return 0
+
+    def __eq__(self, other):
+        return type(self) == type(other)
+

 class MultipleSort(Sort):
    """Sort that encapsulates multiple sub-sorts.
@@ -606,38 +777,67 @@ class MultipleSort(Sort):
        return items

    def __repr__(self):
-        return u'MultipleSort({0})'.format(repr(self.sorts))
+        return 'MultipleSort({!r})'.format(self.sorts)
+
+    def __hash__(self):
+        return hash(tuple(self.sorts))
+
+    def __eq__(self, other):
+        return super(MultipleSort, self).__eq__(other) and \
+            self.sorts == other.sorts


 class FieldSort(Sort):
    """An abstract sort criterion that orders by a specific field (of
    any kind).
    """
-    def __init__(self, field, ascending=True):
+    def __init__(self, field, ascending=True, case_insensitive=True):
        self.field = field
        self.ascending = ascending
+        self.case_insensitive = case_insensitive

    def sort(self, objs):
        # TODO: Conversion and null-detection here. In Python 3,
        # comparisons with None fail. We should also support flexible
        # attributes with different types without falling over.
-        return sorted(objs, key=attrgetter(self.field),
-                      reverse=not self.ascending)
+
+        def key(item):
+            field_val = item.get(self.field, '')
+            if self.case_insensitive and isinstance(field_val, six.text_type):
+                field_val = field_val.lower()
+            return field_val
+
+        return sorted(objs, key=key, reverse=not self.ascending)

    def __repr__(self):
-        return u'<{0}: {1}{2}>'.format(
+        return '<{0}: {1}{2}>'.format(
            type(self).__name__,
            self.field,
            '+' if self.ascending else '-',
        )

+    def __hash__(self):
+        return hash((self.field, self.ascending))
+
+    def __eq__(self, other):
+        return super(FieldSort, self).__eq__(other) and \
+            self.field == other.field and \
+            self.ascending == other.ascending
+

 class FixedFieldSort(FieldSort):
    """Sort object to sort on a fixed field.
    """
    def order_clause(self):
        order = "ASC" if self.ascending else "DESC"
-        return "{0} {1}".format(self.field, order)
+        if self.case_insensitive:
+            field = '(CASE ' \
+                    'WHEN TYPEOF({0})="text" THEN LOWER({0}) ' \
+                    'WHEN TYPEOF({0})="blob" THEN LOWER({0}) ' \
+                    'ELSE {0} END)'.format(self.field)
+        else:
+            field = self.field
+        return "{0} {1}".format(field, order)


 class SlowFieldSort(FieldSort):
@@ -650,5 +850,17 @@ class SlowFieldSort(FieldSort):

 class NullSort(Sort):
    """No sorting. Leave results unsorted."""
-    def sort(items):
+    def sort(self, items):
        return items
+
+    def __nonzero__(self):
+        return self.__bool__()
+
+    def __bool__(self):
+        return False
+
+    def __eq__(self, other):
+        return type(self) == type(other) or other is None
+
+    def __hash__(self):
+        return 0
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2014, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -14,13 +15,17 @@

 """Parsing of strings into DBCore queries.
 """
+from __future__ import division, absolute_import, print_function
+
 import re
 import itertools
 from . import query
-
+import beets

 PARSE_QUERY_PART_REGEX = re.compile(
    # Non-capturing optional segment for the keyword.
+    r'(-|\^)?'   # Negation prefixes.
+
    r'(?:'
    r'(\S+?)'    # The field key.
    r'(?<!\\):'  # Unescaped :
@@ -34,80 +39,124 @@ PARSE_QUERY_PART_REGEX = re.compile(

 def parse_query_part(part, query_classes={}, prefixes={},
                     default_class=query.SubstringQuery):
-    """Take a query in the form of a key/value pair separated by a
-    colon and return a tuple of `(key, value, cls)`. `key` may be None,
-    indicating that any field may be matched. `cls` is a subclass of
-    `FieldQuery`.
+    """Parse a single *query part*, which is a chunk of a complete query
+    string representing a single criterion.

-    The optional `query_classes` parameter maps field names to default
-    query types; `default_class` is the fallback. `prefixes` is a map
-    from query prefix markers and query types. Prefix-indicated queries
-    take precedence over type-based queries.
+    A query part is a string consisting of:
+    - A *pattern*: the value to look for.
+    - Optionally, a *field name* preceding the pattern, separated by a
+      colon. So in `foo:bar`, `foo` is the field name and `bar` is the
+      pattern.
+    - Optionally, a *query prefix* just before the pattern (and after the
+      optional colon) indicating the type of query that should be used. For
+      example, in `~foo`, `~` might be a prefix. (The set of prefixes to
+      look for is given in the `prefixes` parameter.)
+    - Optionally, a negation indicator, `-` or `^`, at the very beginning.

-    To determine the query class, two factors are used: prefixes and
-    field types. For example, the colon prefix denotes a regular
-    expression query and a type map might provide a special kind of
-    query for numeric values. If neither a prefix nor a specific query
-    class is available, `default_class` is used.
+    Both prefixes and the separating `:` character may be escaped with a
+    backslash to avoid their normal meaning.

-    For instance,
-    'stapler' -> (None, 'stapler', SubstringQuery)
-    'color:red' -> ('color', 'red', SubstringQuery)
-    ':^Quiet' -> (None, '^Quiet', RegexpQuery)
-    'color::b..e' -> ('color', 'b..e', RegexpQuery)
+    The function returns a tuple consisting of:
+    - The field name: a string or None if it's not present.
+    - The pattern, a string.
+    - The query class to use, which inherits from the base
+      :class:`Query` type.
+    - A negation flag, a bool.

-    Prefixes may be "escaped" with a backslash to disable the keying
-    behavior.
+    The three optional parameters determine which query class is used (i.e.,
+    the third return value). They are:
+    - `query_classes`, which maps field names to query classes. These
+      are used when no explicit prefix is present.
+    - `prefixes`, which maps prefix strings to query classes.
+    - `default_class`, the fallback when neither the field nor a prefix
+      indicates a query class.
+
+    So the precedence for determining which query class to return is:
+    prefix, followed by field, and finally the default.
+
+    For example, assuming the `:` prefix is used for `RegexpQuery`:
+    - `'stapler'` -> `(None, 'stapler', SubstringQuery, False)`
+    - `'color:red'` -> `('color', 'red', SubstringQuery, False)`
+    - `':^Quiet'` -> `(None, '^Quiet', RegexpQuery, False)`, because
+      the `^` follows the `:`
+    - `'color::b..e'` -> `('color', 'b..e', RegexpQuery, False)`
+    - `'-color:red'` -> `('color', 'red', SubstringQuery, True)`
    """
+    # Apply the regular expression and extract the components.
    part = part.strip()
    match = PARSE_QUERY_PART_REGEX.match(part)

-    assert match  # Regex should always match.
-    key = match.group(1)
-    term = match.group(2).replace('\:', ':')
+    assert match  # Regex should always match
+    negate = bool(match.group(1))
+    key = match.group(2)
+    term = match.group(3).replace('\:', ':')

-    # Match the search term against the list of prefixes.
+    # Check whether there's a prefix in the query and use the
+    # corresponding query type.
    for pre, query_class in prefixes.items():
        if term.startswith(pre):
-            return key, term[len(pre):], query_class
+            return key, term[len(pre):], query_class, negate

-    # No matching prefix: use type-based or fallback/default query.
+    # No matching prefix, so use either the query class determined by
+    # the field or the default as a fallback.
    query_class = query_classes.get(key, default_class)
-    return key, term, query_class
+    return key, term, query_class, negate


 def construct_query_part(model_cls, prefixes, query_part):
-    """Create a query from a single query component, `query_part`, for
-    querying instances of `model_cls`. Return a `Query` instance.
+    """Parse a *query part* string and return a :class:`Query` object.
+
+    :param model_cls: The :class:`Model` class that this is a query for.
+      This is used to determine the appropriate query types for the
+      model's fields.
+    :param prefixes: A map from prefix strings to :class:`Query` types.
+    :param query_part: The string to parse.
+
+    See the documentation for `parse_query_part` for more information on
+    query part syntax.
    """
-    # Shortcut for empty query parts.
+    # A shortcut for empty query parts.
    if not query_part:
        return query.TrueQuery()

-    # Get the query classes for each possible field.
+    # Use `model_cls` to build up a map from field names to `Query`
+    # classes.
    query_classes = {}
    for k, t in itertools.chain(model_cls._fields.items(),
                                model_cls._types.items()):
        query_classes[k] = t.query

    # Parse the string.
-    key, pattern, query_class = \
+    key, pattern, query_class, negate = \
        parse_query_part(query_part, query_classes, prefixes)

-    # No key specified.
+    # If there's no key (field name) specified, this is a "match
+    # anything" query.
    if key is None:
        if issubclass(query_class, query.FieldQuery):
            # The query type matches a specific field, but none was
            # specified. So we use a version of the query that matches
            # any field.
-            return query.AnyFieldQuery(pattern, model_cls._search_fields,
-                                       query_class)
+            q = query.AnyFieldQuery(pattern, model_cls._search_fields,
+                                    query_class)
+            if negate:
+                return query.NotQuery(q)
+            else:
+                return q
        else:
-            # Other query type.
-            return query_class(pattern)
+            # Non-field query type.
+            if negate:
+                return query.NotQuery(query_class(pattern))
+            else:
+                return query_class(pattern)

+    # Otherwise, this must be a `FieldQuery`. Use the field name to
+    # construct the query object.
    key = key.lower()
-    return query_class(key.lower(), pattern, key in model_cls._fields)
+    q = query_class(key.lower(), pattern, key in model_cls._fields)
+    if negate:
+        return query.NotQuery(q)
+    return q


 def query_from_strings(query_cls, model_cls, prefixes, query_parts):
@@ -136,13 +185,15 @@ def construct_sort_part(model_cls, part):
    assert direction in ('+', '-'), "part must end with + or -"
    is_ascending = direction == '+'

+    case_insensitive = beets.config['sort_case_insensitive'].get(bool)
    if field in model_cls._sorts:
-        sort = model_cls._sorts[field](model_cls, is_ascending)
+        sort = model_cls._sorts[field](model_cls, is_ascending,
+                                       case_insensitive)
    elif field in model_cls._fields:
-        sort = query.FixedFieldSort(field, is_ascending)
+        sort = query.FixedFieldSort(field, is_ascending, case_insensitive)
    else:
        # Flexible or computed.
-        sort = query.SlowFieldSort(field, is_ascending)
+        sort = query.SlowFieldSort(field, is_ascending, case_insensitive)
    return sort


@@ -150,31 +201,50 @@ def sort_from_strings(model_cls, sort_parts):
    """Create a `Sort` from a list of sort criteria (strings).
    """
    if not sort_parts:
-        return query.NullSort()
+        sort = query.NullSort()
+    elif len(sort_parts) == 1:
+        sort = construct_sort_part(model_cls, sort_parts[0])
    else:
        sort = query.MultipleSort()
        for part in sort_parts:
            sort.add_sort(construct_sort_part(model_cls, part))
-        return sort
+    return sort


-def parse_sorted_query(model_cls, parts, prefixes={},
-                       query_cls=query.AndQuery):
+def parse_sorted_query(model_cls, parts, prefixes={}):
    """Given a list of strings, create the `Query` and `Sort` that they
    represent.
    """
    # Separate query token and sort token.
    query_parts = []
    sort_parts = []
-    for part in parts:
-        if part.endswith((u'+', u'-')) and u':' not in part:
-            sort_parts.append(part)
-        else:
-            query_parts.append(part)

-    # Parse each.
-    q = query_from_strings(
-        query_cls, model_cls, prefixes, query_parts
-    )
+    # Split up query in to comma-separated subqueries, each representing
+    # an AndQuery, which need to be joined together in one OrQuery
+    subquery_parts = []
+    for part in parts + [u',']:
+        if part.endswith(u','):
+            # Ensure we can catch "foo, bar" as well as "foo , bar"
+            last_subquery_part = part[:-1]
+            if last_subquery_part:
+                subquery_parts.append(last_subquery_part)
+            # Parse the subquery in to a single AndQuery
+            # TODO: Avoid needlessly wrapping AndQueries containing 1 subquery?
+            query_parts.append(query_from_strings(
+                query.AndQuery, model_cls, prefixes, subquery_parts
+            ))
+            del subquery_parts[:]
+        else:
+            # Sort parts (1) end in + or -, (2) don't have a field, and
+            # (3) consist of more than just the + or -.
+            if part.endswith((u'+', u'-')) \
+                    and u':' not in part \
+                    and len(part) > 1:
+                sort_parts.append(part)
+            else:
+                subquery_parts.append(part)
+
+    # Avoid needlessly wrapping single statements in an OR
+    q = query.OrQuery(query_parts) if len(query_parts) > 1 else query_parts[0]
    s = sort_from_strings(model_cls, sort_parts)
    return q, s
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2014, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -14,8 +15,14 @@

 """Representation of type information for DBCore model fields.
 """
+from __future__ import division, absolute_import, print_function
+
 from . import query
 from beets.util import str2bool
+import six
+
+if not six.PY2:
+    buffer = memoryview  # sqlite won't accept memoryview in python 2


 # Abstract base.
@@ -34,7 +41,7 @@ class Type(object):
    """The `Query` subclass to be used when querying the field.
    """

-    model_type = unicode
+    model_type = six.text_type
    """The Python type that is used to represent the value in the model.

    The model is guaranteed to return a value of this type if the field
@@ -58,9 +65,9 @@ class Type(object):
        if value is None:
            value = u''
        if isinstance(value, bytes):
-            value = value.decode('utf8', 'ignore')
+            value = value.decode('utf-8', 'ignore')

-        return unicode(value)
+        return six.text_type(value)

    def parse(self, string):
        """Parse a (possibly human-written) string and return the
@@ -93,13 +100,13 @@ class Type(object):
        http://www.sqlite.org/datatype3.html
        https://docs.python.org/2/library/sqlite3.html#sqlite-and-python-types

-        Flexible fields have the type afinity `TEXT`. This means the
-        `sql_value` is either a `buffer` or a `unicode` object` and the
-        method must handle these in addition.
+        Flexible fields have the type affinity `TEXT`. This means the
+        `sql_value` is either a `buffer`/`memoryview` or a `unicode` object`
+        and the method must handle these in addition.
        """
        if isinstance(sql_value, buffer):
-            sql_value = bytes(sql_value).decode('utf8', 'ignore')
-        if isinstance(sql_value, unicode):
+            sql_value = bytes(sql_value).decode('utf-8', 'ignore')
+        if isinstance(sql_value, six.text_type):
            return self.parse(sql_value)
        else:
            return self.normalize(sql_value)
@@ -191,7 +198,7 @@ class Boolean(Type):
    model_type = bool

    def format(self, value):
-        return unicode(bool(value))
+        return six.text_type(bool(value))

    def parse(self, string):
        return str2bool(string)
@@ -0,0 +1,134 @@
+# -*- coding: utf-8 -*-
+# This file is part of beets.
+# Copyright 2016, Adrian Sampson.
+#
+# Permission is hereby granted, free of charge, to any person obtaining
+# a copy of this software and associated documentation files (the
+# "Software"), to deal in the Software without restriction, including
+# without limitation the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the Software, and to
+# permit persons to whom the Software is furnished to do so, subject to
+# the following conditions:
+#
+# The above copyright notice and this permission notice shall be
+# included in all copies or substantial portions of the Software.
+
+"""A drop-in replacement for the standard-library `logging` module that
+allows {}-style log formatting on Python 2 and 3.
+
+Provides everything the "logging" module does. The only difference is
+that when getLogger(name) instantiates a logger that logger uses
+{}-style formatting.
+"""
+
+from __future__ import division, absolute_import, print_function
+
+from copy import copy
+from logging import *  # noqa
+import subprocess
+import threading
+import six
+
+
+def logsafe(val):
+    """Coerce a potentially "problematic" value so it can be formatted
+    in a Unicode log string.
+
+    This works around a number of pitfalls when logging objects in
+    Python 2:
+    - Logging path names, which must be byte strings, requires
+      conversion for output.
+    - Some objects, including some exceptions, will crash when you call
+      `unicode(v)` while `str(v)` works fine. CalledProcessError is an
+      example.
+    """
+    # Already Unicode.
+    if isinstance(val, six.text_type):
+        return val
+
+    # Bytestring: needs decoding.
+    elif isinstance(val, bytes):
+        # Blindly convert with UTF-8. Eventually, it would be nice to
+        # (a) only do this for paths, if they can be given a distinct
+        # type, and (b) warn the developer if they do this for other
+        # bytestrings.
+        return val.decode('utf-8', 'replace')
+
+    # A "problem" object: needs a workaround.
+    elif isinstance(val, subprocess.CalledProcessError):
+        try:
+            return six.text_type(val)
+        except UnicodeDecodeError:
+            # An object with a broken __unicode__ formatter. Use __str__
+            # instead.
+            return str(val).decode('utf-8', 'replace')
+
+    # Other objects are used as-is so field access, etc., still works in
+    # the format string.
+    else:
+        return val
+
+
+class StrFormatLogger(Logger):
+    """A version of `Logger` that uses `str.format`-style formatting
+    instead of %-style formatting.
+    """
+
+    class _LogMessage(object):
+        def __init__(self, msg, args, kwargs):
+            self.msg = msg
+            self.args = args
+            self.kwargs = kwargs
+
+        def __str__(self):
+            args = [logsafe(a) for a in self.args]
+            kwargs = dict((k, logsafe(v)) for (k, v) in self.kwargs.items())
+            return self.msg.format(*args, **kwargs)
+
+    def _log(self, level, msg, args, exc_info=None, extra=None, **kwargs):
+        """Log msg.format(*args, **kwargs)"""
+        m = self._LogMessage(msg, args, kwargs)
+        return super(StrFormatLogger, self)._log(level, m, (), exc_info, extra)
+
+
+class ThreadLocalLevelLogger(Logger):
+    """A version of `Logger` whose level is thread-local instead of shared.
+    """
+    def __init__(self, name, level=NOTSET):
+        self._thread_level = threading.local()
+        self.default_level = NOTSET
+        super(ThreadLocalLevelLogger, self).__init__(name, level)
+
+    @property
+    def level(self):
+        try:
+            return self._thread_level.level
+        except AttributeError:
+            self._thread_level.level = self.default_level
+            return self.level
+
+    @level.setter
+    def level(self, value):
+        self._thread_level.level = value
+
+    def set_global_level(self, level):
+        """Set the level on the current thread + the default value for all
+        threads.
+        """
+        self.default_level = level
+        self.setLevel(level)
+
+
+class BeetsLogger(ThreadLocalLevelLogger, StrFormatLogger):
+    pass
+
+
+my_manager = copy(Logger.manager)
+my_manager.loggerClass = BeetsLogger
+
+
+def getLogger(name=None):  # noqa
+    if name:
+        return my_manager.getLogger(name)
+    else:
+        return Logger.root
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2013, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -14,15 +15,19 @@

 """Support for beets plugins."""

-import logging
-import traceback
+from __future__ import division, absolute_import, print_function
+
 import inspect
+import traceback
 import re
 from collections import defaultdict
+from functools import wraps


 import beets
+from beets import logging
 from beets import mediafile
+import six

 PLUGIN_NAMESPACE = 'beetsplug'

@@ -41,6 +46,23 @@ class PluginConflictException(Exception):
    """


+class PluginLogFilter(logging.Filter):
+    """A logging filter that identifies the plugin that emitted a log
+    message.
+    """
+    def __init__(self, plugin):
+        self.prefix = u'{0}: '.format(plugin.name)
+
+    def filter(self, record):
+        if hasattr(record.msg, 'msg') and isinstance(record.msg.msg,
+                                                     six.string_types):
+            # A _LogMessage from our hacked-up Logging replacement.
+            record.msg.msg = self.prefix + record.msg.msg
+        elif isinstance(record.msg, six.string_types):
+            record.msg = self.prefix + record.msg
+        return True
+
+
 # Managing the plugins themselves.

 class BeetsPlugin(object):
@@ -51,7 +73,6 @@ class BeetsPlugin(object):
    def __init__(self, name=None):
        """Perform one-time plugin setup.
        """
-        self.import_stages = []
        self.name = name or self.__module__.split('.')[-1]
        self.config = beets.config[self.name]
        if not self.template_funcs:
@@ -60,6 +81,12 @@ class BeetsPlugin(object):
            self.template_fields = {}
        if not self.album_template_fields:
            self.album_template_fields = {}
+        self.import_stages = []
+
+        self._log = log.getChild(self.name)
+        self._log.setLevel(logging.NOTSET)  # Use `beets` logger level.
+        if not any(isinstance(f, PluginLogFilter) for f in self._log.filters):
+            self._log.addFilter(PluginLogFilter(self))

    def commands(self):
        """Should return a list of beets.ui.Subcommand objects for
@@ -67,6 +94,46 @@ class BeetsPlugin(object):
        """
        return ()

+    def get_import_stages(self):
+        """Return a list of functions that should be called as importer
+        pipelines stages.
+
+        The callables are wrapped versions of the functions in
+        `self.import_stages`. Wrapping provides some bookkeeping for the
+        plugin: specifically, the logging level is adjusted to WARNING.
+        """
+        return [self._set_log_level_and_params(logging.WARNING, import_stage)
+                for import_stage in self.import_stages]
+
+    def _set_log_level_and_params(self, base_log_level, func):
+        """Wrap `func` to temporarily set this plugin's logger level to
+        `base_log_level` + config options (and restore it to its previous
+        value after the function returns). Also determines which params may not
+        be sent for backwards-compatibility.
+        """
+        argspec = inspect.getargspec(func)
+
+        @wraps(func)
+        def wrapper(*args, **kwargs):
+            assert self._log.level == logging.NOTSET
+            verbosity = beets.config['verbose'].get(int)
+            log_level = max(logging.DEBUG, base_log_level - 10 * verbosity)
+            self._log.setLevel(log_level)
+            try:
+                try:
+                    return func(*args, **kwargs)
+                except TypeError as exc:
+                    if exc.args[0].startswith(func.__name__):
+                        # caused by 'func' and not stuff internal to 'func'
+                        kwargs = dict((arg, val) for arg, val in kwargs.items()
+                                      if arg in argspec.args)
+                        return func(*args, **kwargs)
+                    else:
+                        raise
+            finally:
+                self._log.setLevel(logging.NOTSET)
+        return wrapper
+
    def queries(self):
        """Should return a dict mapping prefixes to Query subclasses.
        """
@@ -123,37 +190,21 @@ class BeetsPlugin(object):
        mediafile.MediaFile.add_field(name, descriptor)
        library.Item._media_fields.add(name)

+    _raw_listeners = None
    listeners = None

-    @classmethod
-    def register_listener(cls, event, func):
-        """Add a function as a listener for the specified event. (An
-        imperative alternative to the @listen decorator.)
+    def register_listener(self, event, func):
+        """Add a function as a listener for the specified event.
        """
-        if cls.listeners is None:
+        wrapped_func = self._set_log_level_and_params(logging.WARNING, func)
+
+        cls = self.__class__
+        if cls.listeners is None or cls._raw_listeners is None:
+            cls._raw_listeners = defaultdict(list)
            cls.listeners = defaultdict(list)
-        cls.listeners[event].append(func)
-
-    @classmethod
-    def listen(cls, event):
-        """Decorator that adds a function as an event handler for the
-        specified event (as a string). The parameters passed to function
-        will vary depending on what event occurred.
-
-        The function should respond to named parameters.
-        function(**kwargs) will trap all arguments in a dictionary.
-        Example:
-
-            >>> @MyPlugin.listen("imported")
-            >>> def importListener(**kwargs):
-            ...     pass
-        """
-        def helper(func):
-            if cls.listeners is None:
-                cls.listeners = defaultdict(list)
-            cls.listeners[event].append(func)
-            return func
-        return helper
+        if func not in cls._raw_listeners[event]:
+            cls._raw_listeners[event].append(func)
+            cls.listeners[event].append(wrapped_func)

    template_funcs = None
    template_fields = None
@@ -197,14 +248,14 @@ def load_plugins(names=()):
    BeetsPlugin subclasses desired.
    """
    for name in names:
-        modname = '%s.%s' % (PLUGIN_NAMESPACE, name)
+        modname = '{0}.{1}'.format(PLUGIN_NAMESPACE, name)
        try:
            try:
                namespace = __import__(modname, None, None)
            except ImportError as exc:
                # Again, this is hacky:
                if exc.args[0].endswith(' ' + name):
-                    log.warn(u'** plugin {0} not found'.format(name))
+                    log.warning(u'** plugin {0} not found', name)
                else:
                    raise
            else:
@@ -214,8 +265,11 @@ def load_plugins(names=()):
                        _classes.add(obj)

        except:
-            log.warn(u'** error loading plugin {0}'.format(name))
-            log.warn(traceback.format_exc())
+            log.warning(
+                u'** error loading plugin {}:\n{}',
+                name,
+                traceback.format_exc(),
+            )


 _instances = {}
@@ -267,8 +321,8 @@ def types(model_cls):
            if field in types and plugin_types[field] != types[field]:
                raise PluginConflictException(
                    u'Plugin {0} defines flexible field {1} '
-                    'which has already been defined with '
-                    'another type.'.format(plugin.name, field)
+                    u'which has already been defined with '
+                    u'another type.'.format(plugin.name, field)
                )
        types.update(plugin_types)
    return types
@@ -297,41 +351,35 @@ def album_distance(items, album_info, mapping):
 def candidates(items, artist, album, va_likely):
    """Gets MusicBrainz candidates for an album from each plugin.
    """
-    out = []
    for plugin in find_plugins():
-        out.extend(plugin.candidates(items, artist, album, va_likely))
-    return out
+        for candidate in plugin.candidates(items, artist, album, va_likely):
+            yield candidate


 def item_candidates(item, artist, title):
    """Gets MusicBrainz candidates for an item from the plugins.
    """
-    out = []
    for plugin in find_plugins():
-        out.extend(plugin.item_candidates(item, artist, title))
-    return out
+        for item_candidate in plugin.item_candidates(item, artist, title):
+            yield item_candidate


 def album_for_id(album_id):
    """Get AlbumInfo objects for a given ID string.
    """
-    out = []
    for plugin in find_plugins():
-        res = plugin.album_for_id(album_id)
-        if res:
-            out.append(res)
-    return out
+        album = plugin.album_for_id(album_id)
+        if album:
+            yield album


 def track_for_id(track_id):
    """Get TrackInfo objects for a given ID string.
    """
-    out = []
    for plugin in find_plugins():
-        res = plugin.track_for_id(track_id)
-        if res:
-            out.append(res)
-    return out
+        track = plugin.track_for_id(track_id)
+        if track:
+            yield track


 def template_funcs():
@@ -349,8 +397,7 @@ def import_stages():
    """Get a list of import stage functions defined by plugins."""
    stages = []
    for plugin in find_plugins():
-        if hasattr(plugin, 'import_stages'):
-            stages += plugin.import_stages
+        stages += plugin.get_import_stages()
    return stages


@@ -392,18 +439,20 @@ def event_handlers():


 def send(event, **arguments):
-    """Sends an event to all assigned event listeners. Event is the
-    name of  the event to send, all other named arguments go to the
-    event handler(s).
+    """Send an event to all assigned event listeners.

-    Returns a list of return values from the handlers.
+    `event` is the name of  the event to send, all other named arguments
+    are passed along to the handlers.
+
+    Return a list of non-None values returned from the handlers.
    """
-    log.debug(u'Sending event: {0}'.format(event))
+    log.debug(u'Sending event: {0}', event)
+    results = []
    for handler in event_handlers()[event]:
-        # Don't break legacy plugins if we want to pass more arguments
-        argspec = inspect.getargspec(handler).args
-        args = dict((k, v) for k, v in arguments.items() if k in argspec)
-        handler(**args)
+        result = handler(**arguments)
+        if result is not None:
+            results.append(result)
+    return results


 def feat_tokens(for_artist=True):
@@ -433,3 +482,19 @@ def sanitize_choices(choices, choices_all):
            if not (s in seen or seen.add(s)):
                res.extend(list(others) if s == '*' else [s])
    return res
+
+
+def notify_info_yielded(event):
+    """Makes a generator send the event 'event' every time it yields.
+    This decorator is supposed to decorate a generator, but any function
+    returning an iterable should work.
+    Each yielded value is passed to plugins using the 'info' parameter of
+    'send'.
+    """
+    def decorator(generator):
+        def decorated(*args, **kwargs):
+            for v in generator(*args, **kwargs):
+                send(event, info=v)
+                yield v
+        return decorated
+    return decorator
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2014, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -16,28 +17,31 @@
 interface. To invoke the CLI, just call beets.ui.main(). The actual
 CLI commands are implemented in the ui.commands module.
 """
-from __future__ import print_function

-import locale
+from __future__ import division, absolute_import, print_function
+
 import optparse
 import textwrap
 import sys
 from difflib import SequenceMatcher
-import logging
 import sqlite3
 import errno
 import re
 import struct
 import traceback
 import os.path
+from six.moves import input

+from beets import logging
 from beets import library
 from beets import plugins
 from beets import util
 from beets.util.functemplate import Template
 from beets import config
-from beets.util import confit
+from beets.util import confit, as_string
 from beets.autotag import mb
+from beets.dbcore import query as db_query
+import six

 # On Windows platforms, use colorama to support "ANSI" terminal colors.
 if sys.platform == 'win32':
@@ -56,8 +60,8 @@ log.propagate = False  # Don't propagate to root handler.


 PF_KEY_QUERIES = {
-    'comp': 'comp:true',
-    'singleton': 'singleton:true',
+    'comp': u'comp:true',
+    'singleton': u'singleton:true',
 }


@@ -67,68 +71,149 @@ class UserError(Exception):
    """


-# Utilities.
+# Encoding utilities.

-def _encoding():
-    """Tries to guess the encoding used by the terminal."""
+
+def _in_encoding():
+    """Get the encoding to use for *inputting* strings from the console.
+    """
+    return _stream_encoding(sys.stdin)
+
+
+def _out_encoding():
+    """Get the encoding to use for *outputting* strings to the console.
+    """
+    return _stream_encoding(sys.stdout)
+
+
+def _stream_encoding(stream, default='utf-8'):
+    """A helper for `_in_encoding` and `_out_encoding`: get the stream's
+    preferred encoding, using a configured override or a default
+    fallback if neither is not specified.
+    """
    # Configured override?
    encoding = config['terminal_encoding'].get()
    if encoding:
        return encoding

-    # Determine from locale settings.
-    try:
-        return locale.getdefaultlocale()[1] or 'utf8'
-    except ValueError:
-        # Invalid locale environment variable setting. To avoid
-        # failing entirely for no good reason, assume UTF-8.
-        return 'utf8'
+    # For testing: When sys.stdout or sys.stdin is a StringIO under the
+    # test harness, it doesn't have an `encoding` attribute. Just use
+    # UTF-8.
+    if not hasattr(stream, 'encoding'):
+        return default
+
+    # Python's guessed output stream encoding, or UTF-8 as a fallback
+    # (e.g., when piped to a file).
+    return stream.encoding or default


 def decargs(arglist):
    """Given a list of command-line argument bytestrings, attempts to
-    decode them to Unicode strings.
+    decode them to Unicode strings when running under Python 2.
    """
-    return [s.decode(_encoding()) for s in arglist]
+    if six.PY2:
+        return [s.decode(util.arg_encoding()) for s in arglist]
+    else:
+        return arglist


-def print_(*strings):
+def print_(*strings, **kwargs):
    """Like print, but rather than raising an error when a character
    is not in the terminal's encoding's character set, just silently
    replaces it.
-    """
-    if strings:
-        if isinstance(strings[0], unicode):
-            txt = u' '.join(strings)
-        else:
-            txt = ' '.join(strings)
-    else:
-        txt = u''
-    if isinstance(txt, unicode):
-        txt = txt.encode(_encoding(), 'replace')
-    print(txt)

+    The arguments must be Unicode strings: `unicode` on Python 2; `str` on
+    Python 3.
+
+    The `end` keyword argument behaves similarly to the built-in `print`
+    (it defaults to a newline).
+    """
+    if not strings:
+        strings = [u'']
+    assert isinstance(strings[0], six.text_type)
+
+    txt = u' '.join(strings)
+    txt += kwargs.get('end', u'\n')
+
+    # Encode the string and write it to stdout.
+    if six.PY2:
+        # On Python 2, sys.stdout expects bytes.
+        out = txt.encode(_out_encoding(), 'replace')
+        sys.stdout.write(out)
+    else:
+        # On Python 3, sys.stdout expects text strings and uses the
+        # exception-throwing encoding error policy. To avoid throwing
+        # errors and use our configurable encoding override, we use the
+        # underlying bytes buffer instead.
+        if hasattr(sys.stdout, 'buffer'):
+            out = txt.encode(_out_encoding(), 'replace')
+            sys.stdout.buffer.write(out)
+        else:
+            # In our test harnesses (e.g., DummyOut), sys.stdout.buffer
+            # does not exist. We instead just record the text string.
+            sys.stdout.write(txt)
+
+
+# Configuration wrappers.
+
+def _bool_fallback(a, b):
+    """Given a boolean or None, return the original value or a fallback.
+    """
+    if a is None:
+        assert isinstance(b, bool)
+        return b
+    else:
+        assert isinstance(a, bool)
+        return a
+
+
+def should_write(write_opt=None):
+    """Decide whether a command that updates metadata should also write
+    tags, using the importer configuration as the default.
+    """
+    return _bool_fallback(write_opt, config['import']['write'].get(bool))
+
+
+def should_move(move_opt=None):
+    """Decide whether a command that updates metadata should also move
+    files when they're inside the library, using the importer
+    configuration as the default.
+
+    Specifically, commands should move files after metadata updates only
+    when the importer is configured *either* to move *or* to copy files.
+    They should avoid moving files when the importer is configured not
+    to touch any filenames.
+    """
+    return _bool_fallback(
+        move_opt,
+        config['import']['move'].get(bool) or
+        config['import']['copy'].get(bool)
+    )
+
+
+# Input prompts.

 def input_(prompt=None):
-    """Like `raw_input`, but decodes the result to a Unicode string.
+    """Like `input`, but decodes the result to a Unicode string.
    Raises a UserError if stdin is not available. The prompt is sent to
    stdout rather than stderr. A printed between the prompt and the
    input cursor.
    """
    # raw_input incorrectly sends prompts to stderr, not stdout, so we
-    # use print() explicitly to display prompts.
+    # use print_() explicitly to display prompts.
    # http://bugs.python.org/issue1927
    if prompt:
-        if isinstance(prompt, unicode):
-            prompt = prompt.encode(_encoding(), 'replace')
-        print(prompt, end=' ')
+        print_(prompt, end=u' ')

    try:
-        resp = raw_input()
+        resp = input()
    except EOFError:
-        raise UserError('stdin stream ended while input required')
+        raise UserError(u'stdin stream ended while input required')

-    return resp.decode(sys.stdin.encoding or 'utf8', 'ignore')
+    if six.PY2:
+        return resp.decode(_in_encoding(), 'ignore')
+    else:
+        return resp


 def input_options(options, require=False, prompt=None, fallback_prompt=None,
@@ -172,7 +257,7 @@ def input_options(options, require=False, prompt=None, fallback_prompt=None,
                    found_letter = letter
                    break
            else:
-                raise ValueError('no unambiguous lettering found')
+                raise ValueError(u'no unambiguous lettering found')

        letters[found_letter.lower()] = option
        index = option.index(found_letter)
@@ -180,7 +265,7 @@ def input_options(options, require=False, prompt=None, fallback_prompt=None,
        # Mark the option's shortcut letter for display.
        if not require and (
            (default is None and not numrange and first) or
-            (isinstance(default, basestring) and
+            (isinstance(default, six.string_types) and
             found_letter.lower() == default.lower())):
            # The first option is the default; mark it.
            show_letter = '[%s]' % found_letter.upper()
@@ -190,7 +275,7 @@ def input_options(options, require=False, prompt=None, fallback_prompt=None,
            is_default = False

        # Colorize the letter shortcut.
-        show_letter = colorize('turquoise' if is_default else 'blue',
+        show_letter = colorize('action_default' if is_default else 'action',
                               show_letter)

        # Insert the highlighted letter back into the word.
@@ -216,11 +301,11 @@ def input_options(options, require=False, prompt=None, fallback_prompt=None,
        prompt_part_lengths = []
        if numrange:
            if isinstance(default, int):
-                default_name = str(default)
-                default_name = colorize('turquoise', default_name)
+                default_name = six.text_type(default)
+                default_name = colorize('action_default', default_name)
                tmpl = '# selection (default %s)'
                prompt_parts.append(tmpl % default_name)
-                prompt_part_lengths.append(len(tmpl % str(default)))
+                prompt_part_lengths.append(len(tmpl % six.text_type(default)))
            else:
                prompt_parts.append('# selection')
                prompt_part_lengths.append(len(prompt_parts[-1]))
@@ -255,9 +340,9 @@ def input_options(options, require=False, prompt=None, fallback_prompt=None,
    # Make a fallback prompt too. This is displayed if the user enters
    # something that is not recognized.
    if not fallback_prompt:
-        fallback_prompt = 'Enter one of '
+        fallback_prompt = u'Enter one of '
        if numrange:
-            fallback_prompt += '%i-%i, ' % numrange
+            fallback_prompt += u'%i-%i, ' % numrange
        fallback_prompt += ', '.join(display_letters) + ':'

    resp = input_(prompt)
@@ -296,19 +381,52 @@ def input_yn(prompt, require=False):
    "yes" unless `require` is `True`, in which case there is no default.
    """
    sel = input_options(
-        ('y', 'n'), require, prompt, 'Enter Y or N:'
+        ('y', 'n'), require, prompt, u'Enter Y or N:'
    )
-    return sel == 'y'
+    return sel == u'y'


+def input_select_objects(prompt, objs, rep):
+    """Prompt to user to choose all, none, or some of the given objects.
+    Return the list of selected objects.
+
+    `prompt` is the prompt string to use for each question (it should be
+    phrased as an imperative verb). `rep` is a function to call on each
+    object to print it out when confirming objects individually.
+    """
+    choice = input_options(
+        (u'y', u'n', u's'), False,
+        u'%s? (Yes/no/select)' % prompt)
+    print()  # Blank line.
+
+    if choice == u'y':  # Yes.
+        return objs
+
+    elif choice == u's':  # Select.
+        out = []
+        for obj in objs:
+            rep(obj)
+            if input_yn(u'%s? (yes/no)' % prompt, True):
+                out.append(obj)
+            print()  # go to a new line
+        return out
+
+    else:  # No.
+        return []
+
+
+# Human output formatting.
+
 def human_bytes(size):
    """Formats size, a number of bytes, in a human-readable way."""
-    suffices = ['B', 'KB', 'MB', 'GB', 'TB', 'PB', 'EB', 'ZB', 'YB', 'HB']
-    for suffix in suffices:
+    powers = [u'', u'K', u'M', u'G', u'T', u'P', u'E', u'Z', u'Y', u'H']
+    unit = 'B'
+    for power in powers:
        if size < 1024:
-            return "%3.1f %s" % (size, suffix)
+            return u"%3.1f %s%s" % (size, power, unit)
        size /= 1024.0
-    return "big"
+        unit = u'iB'
+    return u"big"


 def human_seconds(interval):
@@ -316,13 +434,13 @@ def human_seconds(interval):
    interval using English words.
    """
    units = [
-        (1, 'second'),
-        (60, 'minute'),
-        (60, 'hour'),
-        (24, 'day'),
-        (7, 'week'),
-        (52, 'year'),
-        (10, 'decade'),
+        (1, u'second'),
+        (60, u'minute'),
+        (60, u'hour'),
+        (24, u'day'),
+        (7, u'week'),
+        (52, u'year'),
+        (10, u'decade'),
    ]
    for i in range(len(units) - 1):
        increment, suffix = units[i]
@@ -335,7 +453,7 @@ def human_seconds(interval):
        increment, suffix = units[-1]
        interval /= float(increment)

-    return "%3.1f %ss" % (interval, suffix)
+    return u"%3.1f %ss" % (interval, suffix)


 def human_seconds_short(interval):
@@ -346,16 +464,45 @@ def human_seconds_short(interval):
    return u'%i:%02i' % (interval // 60, interval % 60)


+# Colorization.
+
 # ANSI terminal colorization code heavily inspired by pygments:
 # http://dev.pocoo.org/hg/pygments-main/file/b2deea5b5030/pygments/console.py
 # (pygments is by Tim Hatch, Armin Ronacher, et al.)
 COLOR_ESCAPE = "\x1b["
-DARK_COLORS = ["black", "darkred", "darkgreen", "brown", "darkblue",
-               "purple", "teal", "lightgray"]
-LIGHT_COLORS = ["darkgray", "red", "green", "yellow", "blue",
-                "fuchsia", "turquoise", "white"]
+DARK_COLORS = {
+    "black": 0,
+    "darkred": 1,
+    "darkgreen": 2,
+    "brown": 3,
+    "darkyellow": 3,
+    "darkblue": 4,
+    "purple": 5,
+    "darkmagenta": 5,
+    "teal": 6,
+    "darkcyan": 6,
+    "lightgray": 7
+}
+LIGHT_COLORS = {
+    "darkgray": 0,
+    "red": 1,
+    "green": 2,
+    "yellow": 3,
+    "blue": 4,
+    "fuchsia": 5,
+    "magenta": 5,
+    "turquoise": 6,
+    "cyan": 6,
+    "white": 7
+}
 RESET_COLOR = COLOR_ESCAPE + "39;49;00m"

+# These abstract COLOR_NAMES are lazily mapped on to the actual color in COLORS
+# as they are defined in the configuration files, see function: colorize
+COLOR_NAMES = ['text_success', 'text_warning', 'text_error', 'text_highlight',
+               'text_highlight_minor', 'action_default', 'action']
+COLORS = None
+

 def _colorize(color, text):
    """Returns a string that prints the given text in the given color
@@ -363,34 +510,47 @@ def _colorize(color, text):
    in DARK_COLORS or LIGHT_COLORS.
    """
    if color in DARK_COLORS:
-        escape = COLOR_ESCAPE + "%im" % (DARK_COLORS.index(color) + 30)
+        escape = COLOR_ESCAPE + "%im" % (DARK_COLORS[color] + 30)
    elif color in LIGHT_COLORS:
-        escape = COLOR_ESCAPE + "%i;01m" % (LIGHT_COLORS.index(color) + 30)
+        escape = COLOR_ESCAPE + "%i;01m" % (LIGHT_COLORS[color] + 30)
    else:
-        raise ValueError('no such color %s', color)
+        raise ValueError(u'no such color %s', color)
    return escape + text + RESET_COLOR


-def colorize(color, text):
+def colorize(color_name, text):
    """Colorize text if colored output is enabled. (Like _colorize but
    conditional.)
    """
-    if config['color']:
+    if config['ui']['color']:
+        global COLORS
+        if not COLORS:
+            COLORS = dict((name,
+                           config['ui']['colors'][name].as_str())
+                          for name in COLOR_NAMES)
+        # In case a 3rd party plugin is still passing the actual color ('red')
+        # instead of the abstract color name ('text_error')
+        color = COLORS.get(color_name)
+        if not color:
+            log.debug(u'Invalid color_name: {0}', color_name)
+            color = color_name
        return _colorize(color, text)
    else:
        return text


-def _colordiff(a, b, highlight='red', minor_highlight='lightgray'):
+def _colordiff(a, b, highlight='text_highlight',
+               minor_highlight='text_highlight_minor'):
    """Given two values, return the same pair of strings except with
    their differences highlighted in the specified color. Strings are
    highlighted intelligently to show differences; other values are
    stringified and highlighted in their entirety.
    """
-    if not isinstance(a, basestring) or not isinstance(b, basestring):
+    if not isinstance(a, six.string_types) \
+       or not isinstance(b, six.string_types):
        # Non-strings: use ordinary equality.
-        a = unicode(a)
-        b = unicode(b)
+        a = six.text_type(a)
+        b = six.text_type(b)
        if a == b:
            return a, b
        else:
@@ -431,14 +591,14 @@ def _colordiff(a, b, highlight='red', minor_highlight='lightgray'):
    return u''.join(a_out), u''.join(b_out)


-def colordiff(a, b, highlight='red'):
+def colordiff(a, b, highlight='text_highlight'):
    """Colorize differences between two values if color is enabled.
    (Like _colordiff but conditional.)
    """
-    if config['color']:
+    if config['ui']['color']:
        return _colordiff(a, b, highlight)
    else:
-        return unicode(a), unicode(b)
+        return six.text_type(a), six.text_type(b)


 def get_path_formats(subview=None):
@@ -449,7 +609,7 @@ def get_path_formats(subview=None):
    subview = subview or config['paths']
    for query, view in subview.items():
        query = PF_KEY_QUERIES.get(query, query)  # Expand common queries.
-        path_formats.append((query, Template(view.get(unicode))))
+        path_formats.append((query, Template(view.as_str())))
    return path_formats


@@ -470,31 +630,6 @@ def get_replacements():
    return replacements


-def _pick_format(album, fmt=None):
-    """Pick a format string for printing Album or Item objects,
-    falling back to config options and defaults.
-    """
-    if fmt:
-        return fmt
-    if album:
-        return config['list_format_album'].get(unicode)
-    else:
-        return config['list_format_item'].get(unicode)
-
-
-def print_obj(obj, lib, fmt=None):
-    """Print an Album or Item object. If `fmt` is specified, use that
-    format string. Otherwise, use the configured template.
-    """
-    album = isinstance(obj, library.Album)
-    fmt = _pick_format(album, fmt)
-    if isinstance(fmt, Template):
-        template = fmt
-    else:
-        template = Template(fmt)
-    print_(obj.evaluate_template(template))
-
-
 def term_width():
    """Get the width (columns) of the terminal."""
    fallback = config['ui']['terminal_width'].get(int)
@@ -542,10 +677,11 @@ def _field_diff(field, old, new):

    # For strings, highlight changes. For others, colorize the whole
    # thing.
-    if isinstance(oldval, basestring):
+    if isinstance(oldval, six.string_types):
        oldstr, newstr = colordiff(oldval, newstr)
    else:
-        oldstr, newstr = colorize('red', oldstr), colorize('red', newstr)
+        oldstr = colorize('text_error', oldstr)
+        newstr = colorize('text_error', newstr)

    return u'{0} -> {1}'.format(oldstr, newstr)

@@ -581,18 +717,178 @@ def show_model_changes(new, old=None, fields=None, always=False):

        changes.append(u'  {0}: {1}'.format(
            field,
-            colorize('red', new.formatted()[field])
+            colorize('text_highlight', new.formatted()[field])
        ))

    # Print changes.
    if changes or always:
-        print_obj(old, old._db)
+        print_(format(old))
    if changes:
        print_(u'\n'.join(changes))

    return bool(changes)


+def show_path_changes(path_changes):
+    """Given a list of tuples (source, destination) that indicate the
+    path changes, log the changes as INFO-level output to the beets log.
+    The output is guaranteed to be unicode.
+
+    Every pair is shown on a single line if the terminal width permits it,
+    else it is split over two lines. E.g.,
+
+    Source -> Destination
+
+    vs.
+
+    Source
+      -> Destination
+    """
+    sources, destinations = zip(*path_changes)
+
+    # Ensure unicode output
+    sources = list(map(util.displayable_path, sources))
+    destinations = list(map(util.displayable_path, destinations))
+
+    # Calculate widths for terminal split
+    col_width = (term_width() - len(' -> ')) // 2
+    max_width = len(max(sources + destinations, key=len))
+
+    if max_width > col_width:
+        # Print every change over two lines
+        for source, dest in zip(sources, destinations):
+            log.info(u'{0} \n  -> {1}', source, dest)
+    else:
+        # Print every change on a single line, and add a header
+        title_pad = max_width - len('Source ') + len(' -> ')
+
+        log.info(u'Source {0} Destination', ' ' * title_pad)
+        for source, dest in zip(sources, destinations):
+            pad = max_width - len(source)
+            log.info(u'{0} {1} -> {2}', source, ' ' * pad, dest)
+
+
+class CommonOptionsParser(optparse.OptionParser, object):
+    """Offers a simple way to add common formatting options.
+
+    Options available include:
+        - matching albums instead of tracks: add_album_option()
+        - showing paths instead of items/albums: add_path_option()
+        - changing the format of displayed items/albums: add_format_option()
+
+    The last one can have several behaviors:
+        - against a special target
+        - with a certain format
+        - autodetected target with the album option
+
+    Each method is fully documented in the related method.
+    """
+    def __init__(self, *args, **kwargs):
+        super(CommonOptionsParser, self).__init__(*args, **kwargs)
+        self._album_flags = False
+        # this serves both as an indicator that we offer the feature AND allows
+        # us to check whether it has been specified on the CLI - bypassing the
+        # fact that arguments may be in any order
+
+    def add_album_option(self, flags=('-a', '--album')):
+        """Add a -a/--album option to match albums instead of tracks.
+
+        If used then the format option can auto-detect whether we're setting
+        the format for items or albums.
+        Sets the album property on the options extracted from the CLI.
+        """
+        album = optparse.Option(*flags, action='store_true',
+                                help=u'match albums instead of tracks')
+        self.add_option(album)
+        self._album_flags = set(flags)
+
+    def _set_format(self, option, opt_str, value, parser, target=None,
+                    fmt=None, store_true=False):
+        """Internal callback that sets the correct format while parsing CLI
+        arguments.
+        """
+        if store_true:
+            setattr(parser.values, option.dest, True)
+
+        # Use the explicitly specified format, or the string from the option.
+        if fmt:
+            value = fmt
+        elif value:
+            value, = decargs([value])
+        else:
+            value = u''
+
+        parser.values.format = value
+        if target:
+            config[target._format_config_key].set(value)
+        else:
+            if self._album_flags:
+                if parser.values.album:
+                    target = library.Album
+                else:
+                    # the option is either missing either not parsed yet
+                    if self._album_flags & set(parser.rargs):
+                        target = library.Album
+                    else:
+                        target = library.Item
+                config[target._format_config_key].set(value)
+            else:
+                config[library.Item._format_config_key].set(value)
+                config[library.Album._format_config_key].set(value)
+
+    def add_path_option(self, flags=('-p', '--path')):
+        """Add a -p/--path option to display the path instead of the default
+        format.
+
+        By default this affects both items and albums. If add_album_option()
+        is used then the target will be autodetected.
+
+        Sets the format property to u'$path' on the options extracted from the
+        CLI.
+        """
+        path = optparse.Option(*flags, nargs=0, action='callback',
+                               callback=self._set_format,
+                               callback_kwargs={'fmt': u'$path',
+                                                'store_true': True},
+                               help=u'print paths for matched items or albums')
+        self.add_option(path)
+
+    def add_format_option(self, flags=('-f', '--format'), target=None):
+        """Add -f/--format option to print some LibModel instances with a
+        custom format.
+
+        `target` is optional and can be one of ``library.Item``, 'item',
+        ``library.Album`` and 'album'.
+
+        Several behaviors are available:
+            - if `target` is given then the format is only applied to that
+            LibModel
+            - if the album option is used then the target will be autodetected
+            - otherwise the format is applied to both items and albums.
+
+        Sets the format property on the options extracted from the CLI.
+        """
+        kwargs = {}
+        if target:
+            if isinstance(target, six.string_types):
+                target = {'item': library.Item,
+                          'album': library.Album}[target]
+            kwargs['target'] = target
+
+        opt = optparse.Option(*flags, action='callback',
+                              callback=self._set_format,
+                              callback_kwargs=kwargs,
+                              help=u'print with custom format')
+        self.add_option(opt)
+
+    def add_all_common_options(self):
+        """Add album, path and format options.
+        """
+        self.add_album_option()
+        self.add_path_option()
+        self.add_format_option()
+
+
 # Subcommand parsing infrastructure.
 #
 # This is a fairly generic subcommand parser for optparse. It is
@@ -610,10 +906,10 @@ class Subcommand(object):
        the subcommand; aliases are alternate names. parser is an
        OptionParser responsible for parsing the subcommand's options.
        help is a short description of the command. If no parser is
-        given, it defaults to a new, empty OptionParser.
+        given, it defaults to a new, empty CommonOptionsParser.
        """
        self.name = name
-        self.parser = parser or optparse.OptionParser()
+        self.parser = parser or CommonOptionsParser()
        self.aliases = aliases
        self.help = help
        self.hide = hide
@@ -632,11 +928,11 @@ class Subcommand(object):
    @root_parser.setter
    def root_parser(self, root_parser):
        self._root_parser = root_parser
-        self.parser.prog = '{0} {1}'.format(root_parser.get_prog_name(),
-                                            self.name)
+        self.parser.prog = '{0} {1}'.format(
+            as_string(root_parser.get_prog_name()), self.name)


-class SubcommandsOptionParser(optparse.OptionParser):
+class SubcommandsOptionParser(CommonOptionsParser):
    """A variant of OptionParser that parses subcommands and their
    arguments.
    """
@@ -648,13 +944,13 @@ class SubcommandsOptionParser(optparse.OptionParser):
        """
        # A more helpful default usage.
        if 'usage' not in kwargs:
-            kwargs['usage'] = """
+            kwargs['usage'] = u"""
  %prog COMMAND [ARGS...]
  %prog help COMMAND"""
        kwargs['add_help_option'] = False

        # Super constructor.
-        optparse.OptionParser.__init__(self, *args, **kwargs)
+        super(SubcommandsOptionParser, self).__init__(*args, **kwargs)

        # Our root parser needs to stop on the first unrecognized argument.
        self.disable_interspersed_args()
@@ -671,7 +967,7 @@ class SubcommandsOptionParser(optparse.OptionParser):
    # Add the list of subcommands to the help message.
    def format_help(self, formatter=None):
        # Get the original help message, to which we will append.
-        out = optparse.OptionParser.format_help(self, formatter)
+        out = super(SubcommandsOptionParser, self).format_help(formatter)
        if formatter is None:
            formatter = self.formatter

@@ -711,7 +1007,8 @@ class SubcommandsOptionParser(optparse.OptionParser):
            result.append(name)
            help_width = formatter.width - help_position
            help_lines = textwrap.wrap(subcommand.help, help_width)
-            result.append("%*s%s\n" % (indent_first, "", help_lines[0]))
+            help_line = help_lines[0] if help_lines else ''
+            result.append("%*s%s\n" % (indent_first, "", help_line))
            result.extend(["%*s%s\n" % (help_position, "", line)
                           for line in help_lines[1:]])
        formatter.dedent()
@@ -756,7 +1053,7 @@ class SubcommandsOptionParser(optparse.OptionParser):
        cmdname = args.pop(0)
        subcommand = self._subcommand_for_name(cmdname)
        if not subcommand:
-            raise UserError("unknown command '{0}'".format(cmdname))
+            raise UserError(u"unknown command '{0}'".format(cmdname))

        suboptions, subargs = subcommand.parse_args(args)
        return subcommand, suboptions, subargs
@@ -765,53 +1062,24 @@ class SubcommandsOptionParser(optparse.OptionParser):
 optparse.Option.ALWAYS_TYPED_ACTIONS += ('callback',)


-def vararg_callback(option, opt_str, value, parser):
-    """Callback for an option with variable arguments.
-    Manually collect arguments right of a callback-action
-    option (ie. with action="callback"), and add the resulting
-    list to the destination var.
-
-    Usage:
-    parser.add_option("-c", "--callback", dest="vararg_attr",
-                      action="callback", callback=vararg_callback)
-
-    Details:
-    http://docs.python.org/2/library/optparse.html#callback-example-6-variable
-    -arguments
-    """
-    value = [value]
-
-    def floatable(str):
-        try:
-            float(str)
-            return True
-        except ValueError:
-            return False
-
-    for arg in parser.rargs:
-        # stop on --foo like options
-        if arg[:2] == "--" and len(arg) > 2:
-            break
-        # stop on -a, but not on -3 or -3.0
-        if arg[:1] == "-" and len(arg) > 1 and not floatable(arg):
-            break
-        value.append(arg)
-
-    del parser.rargs[:len(value) - 1]
-    setattr(parser.values, option.dest, value)
-
-
 # The main entry point and bootstrapping.

 def _load_plugins(config):
    """Load the plugins specified in the configuration.
    """
-    paths = config['pluginpath'].get(confit.StrSeq(split=False))
-    paths = map(util.normpath, paths)
+    paths = config['pluginpath'].as_str_seq(split=False)
+    paths = [util.normpath(p) for p in paths]
+    log.debug(u'plugin paths: {0}', util.displayable_path(paths))

+    # On Python 3, the search paths need to be unicode.
+    paths = [util.py3_path(p) for p in paths]
+
+    # Extend the `beetsplug` package to include the plugin paths.
    import beetsplug
    beetsplug.__path__ = paths + beetsplug.__path__
-    # For backwards compatibility.
+
+    # For backwards compatibility, also support plugin paths that
+    # *contain* a `beetsplug` package.
    sys.path += paths

    plugins.load_plugins(config['plugins'].as_str_seq())
@@ -840,8 +1108,8 @@ def _setup(options, lib=None):
    if lib is None:
        lib = _open_library(config)
        plugins.send("library_opened", lib=lib)
-    library.Item._types = plugins.types(library.Item)
-    library.Album._types = plugins.types(library.Album)
+    library.Item._types.update(plugins.types(library.Item))
+    library.Album._types.update(plugins.types(library.Album))

    return subcommands, plugins, lib

@@ -859,28 +1127,28 @@ def _configure(options):
    config.set_args(options)

    # Configure the logger.
-    if config['verbose'].get(bool):
-        log.setLevel(logging.DEBUG)
+    if config['verbose'].get(int):
+        log.set_global_level(logging.DEBUG)
    else:
-        log.setLevel(logging.INFO)
+        log.set_global_level(logging.INFO)

    config_path = config.user_config_path()
    if os.path.isfile(config_path):
-        log.debug(u'user configuration: {0}'.format(
-            util.displayable_path(config_path)))
+        log.debug(u'user configuration: {0}',
+                  util.displayable_path(config_path))
    else:
-        log.debug(u'no user configuration found at {0}'.format(
-            util.displayable_path(config_path)))
+        log.debug(u'no user configuration found at {0}',
+                  util.displayable_path(config_path))

-    log.debug(u'data directory: {0}'
-              .format(util.displayable_path(config.config_dir())))
+    log.debug(u'data directory: {0}',
+              util.displayable_path(config.config_dir()))
    return config


 def _open_library(config):
    """Create a new library instance from the configuration.
    """
-    dbpath = config['library'].as_filename()
+    dbpath = util.bytestring_path(config['library'].as_filename())
    try:
        lib = library.Library(
            dbpath,
@@ -890,14 +1158,14 @@ def _open_library(config):
        )
        lib.get_item(0)  # Test database connection.
    except (sqlite3.OperationalError, sqlite3.DatabaseError):
-        log.debug(traceback.format_exc())
+        log.debug(u'{}', traceback.format_exc())
        raise UserError(u"database file {0} could not be opened".format(
            util.displayable_path(dbpath)
        ))
    log.debug(u'library database: {0}\n'
-              u'library directory: {1}'
-              .format(util.displayable_path(lib.path),
-                      util.displayable_path(lib.directory)))
+              u'library directory: {1}',
+              util.displayable_path(lib.path),
+              util.displayable_path(lib.directory))
    return lib


@@ -906,16 +1174,18 @@ def _raw_main(args, lib=None):
    handling.
    """
    parser = SubcommandsOptionParser()
+    parser.add_format_option(flags=('--format-item',), target=library.Item)
+    parser.add_format_option(flags=('--format-album',), target=library.Album)
    parser.add_option('-l', '--library', dest='library',
-                      help='library database file to use')
+                      help=u'library database file to use')
    parser.add_option('-d', '--directory', dest='directory',
-                      help="destination music directory")
-    parser.add_option('-v', '--verbose', dest='verbose', action='store_true',
-                      help='print debugging information')
+                      help=u"destination music directory")
+    parser.add_option('-v', '--verbose', dest='verbose', action='count',
+                      help=u'log more details (use twice for even more)')
    parser.add_option('-c', '--config', dest='config',
-                      help='path to configuration file')
+                      help=u'path to configuration file')
    parser.add_option('-h', '--help', dest='help', action='store_true',
-                      help='how this help message and exit')
+                      help=u'show this help message and exit')
    parser.add_option('--version', dest='version', action='store_true',
                      help=optparse.SUPPRESS_HELP)

@@ -924,10 +1194,12 @@ def _raw_main(args, lib=None):
    # Special case for the `config --edit` command: bypass _setup so
    # that an invalid configuration does not prevent the editor from
    # starting.
-    if subargs[0] == 'config' and ('-e' in subargs or '--edit' in subargs):
+    if subargs and subargs[0] == 'config' \
+       and ('-e' in subargs or '--edit' in subargs):
        from beets.ui.commands import config_edit
        return config_edit()

+    test_lib = bool(lib)
    subcommands, plugins, lib = _setup(options, lib)
    parser.add_subcommand(*subcommands)

@@ -935,6 +1207,9 @@ def _raw_main(args, lib=None):
    subcommand.func(lib, suboptions, subargs)

    plugins.send('cli_exit', lib=lib)
+    if not test_lib:
+        # Clean up the library unless it came from the test harness.
+        lib._close()


 def main(args=None):
@@ -945,7 +1220,7 @@ def main(args=None):
        _raw_main(args)
    except UserError as exc:
        message = exc.args[0] if exc.args else None
-        log.error(u'error: {0}'.format(message))
+        log.error(u'error: {0}', message)
        sys.exit(1)
    except util.HumanReadableException as exc:
        exc.log(log)
@@ -953,11 +1228,14 @@ def main(args=None):
    except library.FileOperationError as exc:
        # These errors have reasonable human-readable descriptions, but
        # we still want to log their tracebacks for debugging.
-        log.debug(traceback.format_exc())
-        log.error(exc)
+        log.debug('{}', traceback.format_exc())
+        log.error('{}', exc)
        sys.exit(1)
    except confit.ConfigError as exc:
-        log.error(u'configuration error: {0}'.format(exc))
+        log.error(u'configuration error: {0}', exc)
+        sys.exit(1)
+    except db_query.InvalidQueryError as exc:
+        log.error(u'invalid query: {0}', exc)
        sys.exit(1)
    except IOError as exc:
        if exc.errno == errno.EPIPE:
@@ -967,4 +1245,4 @@ def main(args=None):
            raise
    except KeyboardInterrupt:
        # Silently ignore ^C except in verbose mode.
-        log.debug(traceback.format_exc())
+        log.debug(u'{}', traceback.format_exc())
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2013, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -13,21 +14,28 @@
 # included in all copies or substantial portions of the Software.

 """Miscellaneous utility functions."""
-from __future__ import division

+from __future__ import division, absolute_import, print_function
 import os
 import sys
+import errno
+import locale
 import re
 import shutil
 import fnmatch
-from collections import defaultdict
+from collections import Counter
 import traceback
 import subprocess
 import platform
+import shlex
+from beets.util import hidden
+import six
+from unidecode import unidecode


 MAX_FILENAME_LENGTH = 200
 WINDOWS_MAGIC_PREFIX = u'\\\\?\\'
+SNI_SUPPORTED = sys.version_info >= (2, 7, 9)


 class HumanReadableException(Exception):
@@ -54,22 +62,22 @@ class HumanReadableException(Exception):
    def _gerund(self):
        """Generate a (likely) gerund form of the English verb.
        """
-        if ' ' in self.verb:
+        if u' ' in self.verb:
            return self.verb
-        gerund = self.verb[:-1] if self.verb.endswith('e') else self.verb
-        gerund += 'ing'
+        gerund = self.verb[:-1] if self.verb.endswith(u'e') else self.verb
+        gerund += u'ing'
        return gerund

    def _reasonstr(self):
        """Get the reason as a string."""
-        if isinstance(self.reason, unicode):
+        if isinstance(self.reason, six.text_type):
            return self.reason
-        elif isinstance(self.reason, basestring):  # Byte string.
-            return self.reason.decode('utf8', 'ignore')
+        elif isinstance(self.reason, bytes):
+            return self.reason.decode('utf-8', 'ignore')
        elif hasattr(self.reason, 'strerror'):  # i.e., EnvironmentError
            return self.reason.strerror
        else:
-            return u'"{0}"'.format(unicode(self.reason))
+            return u'"{0}"'.format(six.text_type(self.reason))

    def get_message(self):
        """Create the human-readable description of the error, sans
@@ -83,7 +91,7 @@ class HumanReadableException(Exception):
        """
        if self.tb:
            logger.debug(self.tb)
-        logger.error(u'{0}: {1}'.format(self.error_kind, self.args[0]))
+        logger.error(u'{0}: {1}', self.error_kind, self.args[0])


 class FilesystemError(HumanReadableException):
@@ -149,21 +157,22 @@ def ancestry(path):
    return out


-def sorted_walk(path, ignore=(), logger=None):
+def sorted_walk(path, ignore=(), ignore_hidden=False, logger=None):
    """Like `os.walk`, but yields things in case-insensitive sorted,
    breadth-first order.  Directory and file names matching any glob
    pattern in `ignore` are skipped. If `logger` is provided, then
    warning messages are logged there when a directory cannot be listed.
    """
-    # Make sure the path isn't a Unicode string.
+    # Make sure the pathes aren't Unicode strings.
    path = bytestring_path(path)
+    ignore = [bytestring_path(i) for i in ignore]

    # Get all the directories and files at this level.
    try:
        contents = os.listdir(syspath(path))
    except OSError as exc:
        if logger:
-            logger.warn(u'could not list directory {0}: {1}'.format(
+            logger.warning(u'could not list directory {0}: {1}'.format(
                displayable_path(path), exc.strerror
            ))
        return
@@ -183,10 +192,11 @@ def sorted_walk(path, ignore=(), logger=None):

        # Add to output as either a file or a directory.
        cur = os.path.join(path, base)
-        if os.path.isdir(syspath(cur)):
-            dirs.append(base)
-        else:
-            files.append(base)
+        if (ignore_hidden and not hidden.is_hidden(cur)) or not ignore_hidden:
+            if os.path.isdir(syspath(cur)):
+                dirs.append(base)
+            else:
+                files.append(base)

    # Sort lists (case-insensitive) and yield the current level.
    dirs.sort(key=bytes.lower)
@@ -197,7 +207,7 @@ def sorted_walk(path, ignore=(), logger=None):
    for base in dirs:
        cur = os.path.join(path, base)
        # yield from sorted_walk(...)
-        for res in sorted_walk(cur, ignore, logger):
+        for res in sorted_walk(cur, ignore, ignore_hidden, logger):
            yield res


@@ -260,7 +270,9 @@ def prune_dirs(path, root=None, clutter=('.DS_Store', 'Thumbs.db')):
        if not os.path.exists(directory):
            # Directory gone already.
            continue
-        if fnmatch_all(os.listdir(directory), clutter):
+        clutter = [bytestring_path(c) for c in clutter]
+        match_paths = [bytestring_path(d) for d in os.listdir(directory)]
+        if fnmatch_all(match_paths, clutter):
            # Directory contains only clutter (or nothing).
            try:
                shutil.rmtree(directory)
@@ -294,6 +306,18 @@ def components(path):
    return comps


+def arg_encoding():
+    """Get the encoding for command-line arguments (and other OS
+    locale-sensitive strings).
+    """
+    try:
+        return locale.getdefaultlocale()[1] or 'utf-8'
+    except ValueError:
+        # Invalid locale environment variable setting. To avoid
+        # failing entirely for no good reason, assume UTF-8.
+        return 'utf-8'
+
+
 def _fsencoding():
    """Get the system's filesystem encoding. On Windows, this is always
    UTF-8 (not MBCS).
@@ -305,16 +329,16 @@ def _fsencoding():
        # for Windows paths, so the encoding is actually immaterial so
        # we can avoid dealing with this nastiness. We arbitrarily
        # choose UTF-8.
-        encoding = 'utf8'
+        encoding = 'utf-8'
    return encoding


 def bytestring_path(path):
-    """Given a path, which is either a str or a unicode, returns a str
+    """Given a path, which is either a bytes or a unicode, returns a str
    path (ensuring that we never deal with Unicode pathnames).
    """
    # Pass through bytestrings.
-    if isinstance(path, str):
+    if isinstance(path, bytes):
        return path

    # On Windows, remove the magic prefix added by `syspath`. This makes
@@ -323,11 +347,14 @@ def bytestring_path(path):
    if os.path.__name__ == 'ntpath' and path.startswith(WINDOWS_MAGIC_PREFIX):
        path = path[len(WINDOWS_MAGIC_PREFIX):]

-    # Try to encode with default encodings, but fall back to UTF8.
+    # Try to encode with default encodings, but fall back to utf-8.
    try:
        return path.encode(_fsencoding())
    except (UnicodeError, LookupError):
-        return path.encode('utf8')
+        return path.encode('utf-8')
+
+
+PATH_SEP = bytestring_path(os.sep)


 def displayable_path(path, separator=u'; '):
@@ -337,16 +364,16 @@ def displayable_path(path, separator=u'; '):
    """
    if isinstance(path, (list, tuple)):
        return separator.join(displayable_path(p) for p in path)
-    elif isinstance(path, unicode):
+    elif isinstance(path, six.text_type):
        return path
-    elif not isinstance(path, str):
+    elif not isinstance(path, bytes):
        # A non-string object: just get its unicode representation.
-        return unicode(path)
+        return six.text_type(path)

    try:
        return path.decode(_fsencoding(), 'ignore')
    except (UnicodeError, LookupError):
-        return path.decode('utf8', 'ignore')
+        return path.decode('utf-8', 'ignore')


 def syspath(path, prefix=True):
@@ -360,12 +387,12 @@ def syspath(path, prefix=True):
    if os.path.__name__ != 'ntpath':
        return path

-    if not isinstance(path, unicode):
+    if not isinstance(path, six.text_type):
        # Beets currently represents Windows paths internally with UTF-8
        # arbitrarily. But earlier versions used MBCS because it is
        # reported as the FS encoding by Windows. Try both.
        try:
-            path = path.decode('utf8')
+            path = path.decode('utf-8')
        except UnicodeError:
            # The encoding should always be MBCS, Windows' broken
            # Unicode representation.
@@ -412,7 +439,7 @@ def copy(path, dest, replace=False):
    path = syspath(path)
    dest = syspath(dest)
    if not replace and os.path.exists(dest):
-        raise FilesystemError('file exists', 'copy', (path, dest))
+        raise FilesystemError(u'file exists', 'copy', (path, dest))
    try:
        shutil.copyfile(path, dest)
    except (OSError, IOError) as exc:
@@ -433,8 +460,7 @@ def move(path, dest, replace=False):
    path = syspath(path)
    dest = syspath(dest)
    if os.path.exists(dest) and not replace:
-        raise FilesystemError('file exists', 'rename', (path, dest),
-                              traceback.format_exc())
+        raise FilesystemError(u'file exists', 'rename', (path, dest))

    # First, try renaming the file.
    try:
@@ -452,23 +478,52 @@ def move(path, dest, replace=False):
 def link(path, dest, replace=False):
    """Create a symbolic link from path to `dest`. Raises an OSError if
    `dest` already exists, unless `replace` is True. Does nothing if
-    `path` == `dest`."""
-    if (samefile(path, dest)):
+    `path` == `dest`.
+    """
+    if samefile(path, dest):
        return

-    path = syspath(path)
-    dest = syspath(dest)
-    if os.path.exists(dest) and not replace:
-        raise FilesystemError('file exists', 'rename', (path, dest),
-                              traceback.format_exc())
+    if os.path.exists(syspath(dest)) and not replace:
+        raise FilesystemError(u'file exists', 'rename', (path, dest))
    try:
-        os.symlink(path, dest)
-    except OSError:
-        raise FilesystemError('Operating system does not support symbolic '
-                              'links.', 'link', (path, dest),
+        os.symlink(syspath(path), syspath(dest))
+    except NotImplementedError:
+        # raised on python >= 3.2 and Windows versions before Vista
+        raise FilesystemError(u'OS does not support symbolic links.'
+                              'link', (path, dest), traceback.format_exc())
+    except OSError as exc:
+        # TODO: Windows version checks can be removed for python 3
+        if hasattr('sys', 'getwindowsversion'):
+            if sys.getwindowsversion()[0] < 6:  # is before Vista
+                exc = u'OS does not support symbolic links.'
+        raise FilesystemError(exc, 'link', (path, dest),
                              traceback.format_exc())


+def hardlink(path, dest, replace=False):
+    """Create a hard link from path to `dest`. Raises an OSError if
+    `dest` already exists, unless `replace` is True. Does nothing if
+    `path` == `dest`.
+    """
+    if samefile(path, dest):
+        return
+
+    if os.path.exists(syspath(dest)) and not replace:
+        raise FilesystemError(u'file exists', 'rename', (path, dest))
+    try:
+        os.link(syspath(path), syspath(dest))
+    except NotImplementedError:
+        raise FilesystemError(u'OS does not support hard links.'
+                              'link', (path, dest), traceback.format_exc())
+    except OSError as exc:
+        if exc.errno == errno.EXDEV:
+            raise FilesystemError(u'Cannot hard link across devices.'
+                                  'link', (path, dest), traceback.format_exc())
+        else:
+            raise FilesystemError(exc, 'link', (path, dest),
+                                  traceback.format_exc())
+
+
 def unique_path(path):
    """Returns a version of ``path`` that does not exist on the
    filesystem. Specifically, if ``path` itself already exists, then
@@ -478,7 +533,7 @@ def unique_path(path):
        return path

    base, ext = os.path.splitext(path)
-    match = re.search(r'\.(\d)+$', base)
+    match = re.search(br'\.(\d)+$', base)
    if match:
        num = int(match.group(1))
        base = base[:match.start()]
@@ -486,7 +541,8 @@ def unique_path(path):
        num = 0
    while True:
        num += 1
-        new_path = '%s.%i%s' % (base, num, ext)
+        suffix = u'.{}'.format(num).encode() + ext
+        new_path = base + suffix
        if not os.path.exists(new_path):
            return new_path

@@ -495,12 +551,12 @@ def unique_path(path):
 # shares, which are sufficiently common as to cause frequent problems.
 # http://msdn.microsoft.com/en-us/library/windows/desktop/aa365247.aspx
 CHAR_REPLACE = [
-    (re.compile(ur'[\\/]'), u'_'),  # / and \ -- forbidden everywhere.
-    (re.compile(ur'^\.'), u'_'),  # Leading dot (hidden files on Unix).
-    (re.compile(ur'[\x00-\x1f]'), u''),  # Control characters.
-    (re.compile(ur'[<>:"\?\*\|]'), u'_'),  # Windows "reserved characters".
-    (re.compile(ur'\.$'), u'_'),  # Trailing dots.
-    (re.compile(ur'\s+$'), u''),  # Trailing whitespace.
+    (re.compile(r'[\\/]'), u'_'),  # / and \ -- forbidden everywhere.
+    (re.compile(r'^\.'), u'_'),  # Leading dot (hidden files on Unix).
+    (re.compile(r'[\x00-\x1f]'), u''),  # Control characters.
+    (re.compile(r'[<>:"\?\*\|]'), u'_'),  # Windows "reserved characters".
+    (re.compile(r'\.$'), u'_'),  # Trailing dots.
+    (re.compile(r'\s+$'), u''),  # Trailing whitespace.
 ]


@@ -542,73 +598,142 @@ def truncate_path(path, length=MAX_FILENAME_LENGTH):
    return os.path.join(*out)


+def _legalize_stage(path, replacements, length, extension, fragment):
+    """Perform a single round of path legalization steps
+    (sanitation/replacement, encoding from Unicode to bytes,
+    extension-appending, and truncation). Return the path (Unicode if
+    `fragment` is set, `bytes` otherwise) and whether truncation was
+    required.
+    """
+    # Perform an initial sanitization including user replacements.
+    path = sanitize_path(path, replacements)
+
+    # Encode for the filesystem.
+    if not fragment:
+        path = bytestring_path(path)
+
+    # Preserve extension.
+    path += extension.lower()
+
+    # Truncate too-long components.
+    pre_truncate_path = path
+    path = truncate_path(path, length)
+
+    return path, path != pre_truncate_path
+
+
+def legalize_path(path, replacements, length, extension, fragment):
+    """Given a path-like Unicode string, produce a legal path. Return
+    the path and a flag indicating whether some replacements had to be
+    ignored (see below).
+
+    The legalization process (see `_legalize_stage`) consists of
+    applying the sanitation rules in `replacements`, encoding the string
+    to bytes (unless `fragment` is set), truncating components to
+    `length`, appending the `extension`.
+
+    This function performs up to three calls to `_legalize_stage` in
+    case truncation conflicts with replacements (as can happen when
+    truncation creates whitespace at the end of the string, for
+    example). The limited number of iterations iterations avoids the
+    possibility of an infinite loop of sanitation and truncation
+    operations, which could be caused by replacement rules that make the
+    string longer. The flag returned from this function indicates that
+    the path has to be truncated twice (indicating that replacements
+    made the string longer again after it was truncated); the
+    application should probably log some sort of warning.
+    """
+
+    if fragment:
+        # Outputting Unicode.
+        extension = extension.decode('utf-8', 'ignore')
+
+    first_stage_path, _ = _legalize_stage(
+        path, replacements, length, extension, fragment
+    )
+
+    # Convert back to Unicode with extension removed.
+    first_stage_path, _ = os.path.splitext(displayable_path(first_stage_path))
+
+    # Re-sanitize following truncation (including user replacements).
+    second_stage_path, retruncated = _legalize_stage(
+        first_stage_path, replacements, length, extension, fragment
+    )
+
+    # If the path was once again truncated, discard user replacements
+    # and run through one last legalization stage.
+    if retruncated:
+        second_stage_path, _ = _legalize_stage(
+            first_stage_path, None, length, extension, fragment
+        )
+
+    return second_stage_path, retruncated
+
+
+def py3_path(path):
+    """Convert a bytestring path to Unicode on Python 3 only. On Python
+    2, return the bytestring path unchanged.
+
+    This helps deal with APIs on Python 3 that *only* accept Unicode
+    (i.e., `str` objects). I philosophically disagree with this
+    decision, because paths are sadly bytes on Unix, but that's the way
+    it is. So this function helps us "smuggle" the true bytes data
+    through APIs that took Python 3's Unicode mandate too seriously.
+    """
+    if isinstance(path, six.text_type):
+        return path
+    assert isinstance(path, bytes)
+    if six.PY2:
+        return path
+    return os.fsdecode(path)
+
+
 def str2bool(value):
    """Returns a boolean reflecting a human-entered string."""
-    if value.lower() in ('yes', '1', 'true', 't', 'y'):
-        return True
-    else:
-        return False
+    return value.lower() in (u'yes', u'1', u'true', u't', u'y')


 def as_string(value):
    """Convert a value to a Unicode object for matching with a query.
    None becomes the empty string. Bytestrings are silently decoded.
    """
+    if six.PY2:
+        buffer_types = buffer, memoryview  # noqa: F821
+    else:
+        buffer_types = memoryview
+
    if value is None:
        return u''
-    elif isinstance(value, buffer):
-        return str(value).decode('utf8', 'ignore')
-    elif isinstance(value, str):
-        return value.decode('utf8', 'ignore')
+    elif isinstance(value, buffer_types):
+        return bytes(value).decode('utf-8', 'ignore')
+    elif isinstance(value, bytes):
+        return value.decode('utf-8', 'ignore')
    else:
-        return unicode(value)
+        return six.text_type(value)


-def levenshtein(s1, s2):
-    """A nice DP edit distance implementation from Wikibooks:
-    http://en.wikibooks.org/wiki/Algorithm_implementation/Strings/
-    Levenshtein_distance#Python
+def text_string(value, encoding='utf-8'):
+    """Convert a string, which can either be bytes or unicode, to
+    unicode.
+
+    Text (unicode) is left untouched; bytes are decoded. This is useful
+    to convert from a "native string" (bytes on Python 2, str on Python
+    3) to a consistently unicode value.
    """
-    if len(s1) < len(s2):
-        return levenshtein(s2, s1)
-    if not s1:
-        return len(s2)
-
-    previous_row = xrange(len(s2) + 1)
-    for i, c1 in enumerate(s1):
-        current_row = [i + 1]
-        for j, c2 in enumerate(s2):
-            insertions = previous_row[j + 1] + 1
-            deletions = current_row[j] + 1
-            substitutions = previous_row[j] + (c1 != c2)
-            current_row.append(min(insertions, deletions, substitutions))
-        previous_row = current_row
-
-    return previous_row[-1]
+    if isinstance(value, bytes):
+        return value.decode(encoding)
+    return value


 def plurality(objs):
-    """Given a sequence of comparable objects, returns the object that
-    is most common in the set and the frequency of that object. The
+    """Given a sequence of hashble objects, returns the object that
+    is most common in the set and the its number of appearance. The
    sequence must contain at least one object.
    """
-    # Calculate frequencies.
-    freqs = defaultdict(int)
-    for obj in objs:
-        freqs[obj] += 1
-
-    if not freqs:
-        raise ValueError('sequence must be non-empty')
-
-    # Find object with maximum frequency.
-    max_freq = 0
-    res = None
-    for obj, freq in freqs.items():
-        if freq > max_freq:
-            max_freq = freq
-            res = obj
-
-    return res, max_freq
+    c = Counter(objs)
+    if not c:
+        raise ValueError(u'sequence must be non-empty')
+    return c.most_common(1)[0]


 def cpu_count():
@@ -624,8 +749,8 @@ def cpu_count():
            num = 0
    elif sys.platform == 'darwin':
        try:
-            num = int(command_output(['sysctl', '-n', 'hw.ncpu']))
-        except ValueError:
+            num = int(command_output(['/usr/sbin/sysctl', '-n', 'hw.ncpu']))
+        except (ValueError, OSError, subprocess.CalledProcessError):
            num = 0
    else:
        try:
@@ -638,21 +763,40 @@ def cpu_count():
        return 1


+def convert_command_args(args):
+    """Convert command arguments to bytestrings on Python 2 and
+    surrogate-escaped strings on Python 3."""
+    assert isinstance(args, list)
+
+    def convert(arg):
+        if six.PY2:
+            if isinstance(arg, six.text_type):
+                arg = arg.encode(arg_encoding())
+        else:
+            if isinstance(arg, bytes):
+                arg = arg.decode(arg_encoding(), 'surrogateescape')
+        return arg
+
+    return [convert(a) for a in args]
+
+
 def command_output(cmd, shell=False):
    """Runs the command and returns its output after it has exited.

-    ``cmd`` is a list of arguments starting with the command names.  If
-    ``shell`` is true, ``cmd`` is assumed to be a string and passed to a
+    ``cmd`` is a list of arguments starting with the command names. The
+    arguments are bytes on Unix and strings on Windows.
+    If ``shell`` is true, ``cmd`` is assumed to be a string and passed to a
    shell to execute.

    If the process exits with a non-zero return code
    ``subprocess.CalledProcessError`` is raised. May also raise
    ``OSError``.

-    This replaces `subprocess.check_output`, which isn't available in
-    Python 2.6 and which can have problems if lots of output is sent to
-    stderr.
+    This replaces `subprocess.check_output` which can have problems if lots of
+    output is sent to stderr.
    """
+    cmd = convert_command_args(cmd)
+
    proc = subprocess.Popen(
        cmd,
        stdout=subprocess.PIPE,
@@ -665,6 +809,7 @@ def command_output(cmd, shell=False):
        raise subprocess.CalledProcessError(
            returncode=proc.returncode,
            cmd=' '.join(cmd),
+            output=stdout + stderr,
        )
    return stdout

@@ -684,3 +829,165 @@ def max_filename_length(path, limit=MAX_FILENAME_LENGTH):
        return min(res[9], limit)
    else:
        return limit
+
+
+def open_anything():
+    """Return the system command that dispatches execution to the correct
+    program.
+    """
+    sys_name = platform.system()
+    if sys_name == 'Darwin':
+        base_cmd = 'open'
+    elif sys_name == 'Windows':
+        base_cmd = 'start'
+    else:  # Assume Unix
+        base_cmd = 'xdg-open'
+    return base_cmd
+
+
+def editor_command():
+    """Get a command for opening a text file.
+
+    Use the `EDITOR` environment variable by default. If it is not
+    present, fall back to `open_anything()`, the platform-specific tool
+    for opening files in general.
+    """
+    editor = os.environ.get('EDITOR')
+    if editor:
+        return editor
+    return open_anything()
+
+
+def shlex_split(s):
+    """Split a Unicode or bytes string according to shell lexing rules.
+
+    Raise `ValueError` if the string is not a well-formed shell string.
+    This is a workaround for a bug in some versions of Python.
+    """
+    if not six.PY2 or isinstance(s, bytes):  # Shlex works fine.
+        return shlex.split(s)
+
+    elif isinstance(s, six.text_type):
+        # Work around a Python bug.
+        # http://bugs.python.org/issue6988
+        bs = s.encode('utf-8')
+        return [c.decode('utf-8') for c in shlex.split(bs)]
+
+    else:
+        raise TypeError(u'shlex_split called with non-string')
+
+
+def interactive_open(targets, command):
+    """Open the files in `targets` by `exec`ing a new `command`, given
+    as a Unicode string. (The new program takes over, and Python
+    execution ends: this does not fork a subprocess.)
+
+    Can raise `OSError`.
+    """
+    assert command
+
+    # Split the command string into its arguments.
+    try:
+        args = shlex_split(command)
+    except ValueError:  # Malformed shell tokens.
+        args = [command]
+
+    args.insert(0, args[0])  # for argv[0]
+
+    args += targets
+
+    return os.execlp(*args)
+
+
+def _windows_long_path_name(short_path):
+    """Use Windows' `GetLongPathNameW` via ctypes to get the canonical,
+    long path given a short filename.
+    """
+    if not isinstance(short_path, six.text_type):
+        short_path = short_path.decode(_fsencoding())
+
+    import ctypes
+    buf = ctypes.create_unicode_buffer(260)
+    get_long_path_name_w = ctypes.windll.kernel32.GetLongPathNameW
+    return_value = get_long_path_name_w(short_path, buf, 260)
+
+    if return_value == 0 or return_value > 260:
+        # An error occurred
+        return short_path
+    else:
+        long_path = buf.value
+        # GetLongPathNameW does not change the case of the drive
+        # letter.
+        if len(long_path) > 1 and long_path[1] == ':':
+            long_path = long_path[0].upper() + long_path[1:]
+        return long_path
+
+
+def case_sensitive(path):
+    """Check whether the filesystem at the given path is case sensitive.
+
+    To work best, the path should point to a file or a directory. If the path
+    does not exist, assume a case sensitive file system on every platform
+    except Windows.
+    """
+    # A fallback in case the path does not exist.
+    if not os.path.exists(syspath(path)):
+        # By default, the case sensitivity depends on the platform.
+        return platform.system() != 'Windows'
+
+    # If an upper-case version of the path exists but a lower-case
+    # version does not, then the filesystem must be case-sensitive.
+    # (Otherwise, we have more work to do.)
+    if not (os.path.exists(syspath(path.lower())) and
+            os.path.exists(syspath(path.upper()))):
+        return True
+
+    # Both versions of the path exist on the file system. Check whether
+    # they refer to different files by their inodes. Alas,
+    # `os.path.samefile` is only available on Unix systems on Python 2.
+    if platform.system() != 'Windows':
+        return not os.path.samefile(syspath(path.lower()),
+                                    syspath(path.upper()))
+
+    # On Windows, we check whether the canonical, long filenames for the
+    # files are the same.
+    lower = _windows_long_path_name(path.lower())
+    upper = _windows_long_path_name(path.upper())
+    return lower != upper
+
+
+def raw_seconds_short(string):
+    """Formats a human-readable M:SS string as a float (number of seconds).
+
+    Raises ValueError if the conversion cannot take place due to `string` not
+    being in the right format.
+    """
+    match = re.match(r'^(\d+):([0-5]\d)$', string)
+    if not match:
+        raise ValueError(u'String not in M:SS format')
+    minutes, seconds = map(int, match.groups())
+    return float(minutes * 60 + seconds)
+
+
+def asciify_path(path, sep_replace):
+    """Decodes all unicode characters in a path into ASCII equivalents.
+
+    Substitutions are provided by the unidecode module. Path separators in the
+    input are preserved.
+
+    Keyword arguments:
+    path -- The path to be asciified.
+    sep_replace -- the string to be used to replace extraneous path separators.
+    """
+    # if this platform has an os.altsep, change it to os.sep.
+    if os.altsep:
+        path = path.replace(os.altsep, os.sep)
+    path_components = path.split(os.sep)
+    for index, item in enumerate(path_components):
+        path_components[index] = unidecode(item).replace(os.sep, sep_replace)
+        if os.altsep:
+            path_components[index] = unidecode(item).replace(
+                os.altsep,
+                sep_replace
+            )
+    return os.sep.join(path_components)
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2014, Fabrice Laporte
+# Copyright 2016, Fabrice Laporte
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -15,20 +16,26 @@
 """Abstraction layer to resize images using PIL, ImageMagick, or a
 public resizing proxy if neither is available.
 """
-import urllib
+from __future__ import division, absolute_import, print_function
+
 import subprocess
 import os
 import re
 from tempfile import NamedTemporaryFile
-import logging
+from six.moves.urllib.parse import urlencode
+from beets import logging
 from beets import util
+import six

 # Resizing methods
 PIL = 1
 IMAGEMAGICK = 2
 WEBPROXY = 3

-PROXY_URL = 'http://images.weserv.nl/'
+if util.SNI_SUPPORTED:
+    PROXY_URL = 'https://images.weserv.nl/'
+else:
+    PROXY_URL = 'http://images.weserv.nl/'

 log = logging.getLogger('beets')

@@ -37,9 +44,9 @@ def resize_url(url, maxwidth):
    """Return a proxied image URL that resizes the original image to
    maxwidth (preserving aspect ratio).
    """
-    return '{0}?{1}'.format(PROXY_URL, urllib.urlencode({
+    return '{0}?{1}'.format(PROXY_URL, urlencode({
        'url': url.replace('http://', ''),
-        'w': str(maxwidth),
+        'w': maxwidth,
    }))


@@ -48,8 +55,8 @@ def temp_file_for(path):
    specified path.
    """
    ext = os.path.splitext(path)[1]
-    with NamedTemporaryFile(suffix=ext, delete=False) as f:
-        return f.name
+    with NamedTemporaryFile(suffix=util.py3_path(ext), delete=False) as f:
+        return util.bytestring_path(f.name)


 def pil_resize(maxwidth, path_in, path_out=None):
@@ -58,9 +65,8 @@ def pil_resize(maxwidth, path_in, path_out=None):
    """
    path_out = path_out or temp_file_for(path_in)
    from PIL import Image
-    log.debug(u'artresizer: PIL resizing {0} to {1}'.format(
-        util.displayable_path(path_in), util.displayable_path(path_out)
-    ))
+    log.debug(u'artresizer: PIL resizing {0} to {1}',
+              util.displayable_path(path_in), util.displayable_path(path_out))

    try:
        im = Image.open(util.syspath(path_in))
@@ -69,9 +75,8 @@ def pil_resize(maxwidth, path_in, path_out=None):
        im.save(path_out)
        return path_out
    except IOError:
-        log.error(u"PIL cannot create thumbnail for '{0}'".format(
-            util.displayable_path(path_in)
-        ))
+        log.error(u"PIL cannot create thumbnail for '{0}'",
+                  util.displayable_path(path_in))
        return path_in


@@ -80,9 +85,8 @@ def im_resize(maxwidth, path_in, path_out=None):
    Return the output path of resized image.
    """
    path_out = path_out or temp_file_for(path_in)
-    log.debug(u'artresizer: ImageMagick resizing {0} to {1}'.format(
-        util.displayable_path(path_in), util.displayable_path(path_out)
-    ))
+    log.debug(u'artresizer: ImageMagick resizing {0} to {1}',
+              util.displayable_path(path_in), util.displayable_path(path_out))

    # "-resize widthxheight>" shrinks images with dimension(s) larger
    # than the corresponding width and/or height dimension(s). The >
@@ -90,13 +94,13 @@ def im_resize(maxwidth, path_in, path_out=None):
    # compatibility.
    try:
        util.command_output([
-            'convert', util.syspath(path_in),
-            '-resize', '{0}x^>'.format(maxwidth), path_out
+            'convert', util.syspath(path_in, prefix=False),
+            '-resize', '{0}x^>'.format(maxwidth),
+            util.syspath(path_out, prefix=False),
        ])
    except subprocess.CalledProcessError:
-        log.warn(u'artresizer: IM convert failed for {0}'.format(
-            util.displayable_path(path_in)
-        ))
+        log.warning(u'artresizer: IM convert failed for {0}',
+                    util.displayable_path(path_in))
        return path_in
    return path_out

@@ -107,34 +111,67 @@ BACKEND_FUNCS = {
 }


+def pil_getsize(path_in):
+    from PIL import Image
+    try:
+        im = Image.open(util.syspath(path_in))
+        return im.size
+    except IOError as exc:
+        log.error(u"PIL could not read file {}: {}",
+                  util.displayable_path(path_in), exc)
+
+
+def im_getsize(path_in):
+    cmd = ['identify', '-format', '%w %h',
+           util.syspath(path_in, prefix=False)]
+    try:
+        out = util.command_output(cmd)
+    except subprocess.CalledProcessError as exc:
+        log.warning(u'ImageMagick size query failed')
+        log.debug(
+            u'`convert` exited with (status {}) when '
+            u'getting size with command {}:\n{}',
+            exc.returncode, cmd, exc.output.strip()
+        )
+        return
+    try:
+        return tuple(map(int, out.split(b' ')))
+    except IndexError:
+        log.warning(u'Could not understand IM output: {0!r}', out)
+
+
+BACKEND_GET_SIZE = {
+    PIL: pil_getsize,
+    IMAGEMAGICK: im_getsize,
+}
+
+
 class Shareable(type):
    """A pseudo-singleton metaclass that allows both shared and
    non-shared instances. The ``MyClass.shared`` property holds a
    lazily-created shared instance of ``MyClass`` while calling
    ``MyClass()`` to construct a new object works as usual.
    """
-    def __init__(cls, name, bases, dict):
-        super(Shareable, cls).__init__(name, bases, dict)
-        cls._instance = None
+    def __init__(self, name, bases, dict):
+        super(Shareable, self).__init__(name, bases, dict)
+        self._instance = None

    @property
-    def shared(cls):
-        if cls._instance is None:
-            cls._instance = cls()
-        return cls._instance
+    def shared(self):
+        if self._instance is None:
+            self._instance = self()
+        return self._instance


-class ArtResizer(object):
+class ArtResizer(six.with_metaclass(Shareable, object)):
    """A singleton class that performs image resizes.
    """
-    __metaclass__ = Shareable

-    def __init__(self, method=None):
-        """Create a resizer object for the given method or, if none is
-        specified, with an inferred method.
+    def __init__(self):
+        """Create a resizer object with an inferred method.
        """
-        self.method = self._check_method(method)
-        log.debug(u"artresizer: method is {0}".format(self.method))
+        self.method = self._check_method()
+        log.debug(u"artresizer: method is {0}", self.method)
        self.can_compare = self._can_compare()

    def resize(self, maxwidth, path_in, path_out=None):
@@ -165,47 +202,61 @@ class ArtResizer(object):
        """
        return self.method[0] in BACKEND_FUNCS

+    def get_size(self, path_in):
+        """Return the size of an image file as an int couple (width, height)
+        in pixels.
+
+        Only available locally
+        """
+        if self.local:
+            func = BACKEND_GET_SIZE[self.method[0]]
+            return func(path_in)
+
    def _can_compare(self):
        """A boolean indicating whether image comparison is available"""

        return self.method[0] == IMAGEMAGICK and self.method[1] > (6, 8, 7)

    @staticmethod
-    def _check_method(method=None):
-        """A tuple indicating whether current method is available and its
-        version. If no method is given, it returns a supported one.
-        """
-        # Guess available method
-        if not method:
-            for m in [IMAGEMAGICK, PIL]:
-                _, version = ArtResizer._check_method(m)
-                if version:
-                    return (m, version)
-            return (WEBPROXY, (0))
+    def _check_method():
+        """Return a tuple indicating an available method and its version."""
+        version = get_im_version()
+        if version:
+            return IMAGEMAGICK, version

-        if method == IMAGEMAGICK:
+        version = get_pil_version()
+        if version:
+            return PIL, version

-            # Try invoking ImageMagick's "convert".
-            try:
-                out = util.command_output(['identify', '--version'])
+        return WEBPROXY, (0)

-                if 'imagemagick' in out.lower():
-                    pattern = r".+ (\d+)\.(\d+)\.(\d+).*"
-                    match = re.search(pattern, out)
-                    if match:
-                        return (IMAGEMAGICK,
-                                (int(match.group(1)),
-                                 int(match.group(2)),
-                                 int(match.group(3))))
-                    return (IMAGEMAGICK, (0))

-            except (subprocess.CalledProcessError, OSError):
-                return (IMAGEMAGICK, None)
+def get_im_version():
+    """Return Image Magick version or None if it is unavailable
+    Try invoking ImageMagick's "convert".
+    """
+    try:
+        out = util.command_output(['convert', '--version'])

-        if method == PIL:
-            # Try importing PIL.
-            try:
-                __import__('PIL', fromlist=['Image'])
-                return (PIL, (0))
-            except ImportError:
-                return (PIL, None)
+        if b'imagemagick' in out.lower():
+            pattern = br".+ (\d+)\.(\d+)\.(\d+).*"
+            match = re.search(pattern, out)
+            if match:
+                return (int(match.group(1)),
+                        int(match.group(2)),
+                        int(match.group(3)))
+            return (0,)
+
+    except (subprocess.CalledProcessError, OSError) as exc:
+        log.debug(u'ImageMagick check `convert --version` failed: {}', exc)
+        return None
+
+
+def get_pil_version():
+    """Return Image Magick version or None if it is unavailable
+    Try importing PIL."""
+    try:
+        __import__('PIL', fromlist=[str('Image')])
+        return (0,)
+    except ImportError:
+        return None
@@ -1,3 +1,5 @@
+# -*- coding: utf-8 -*-
+
 """Extremely simple pure-Python implementation of coroutine-style
 asynchronous socket I/O. Inspired by, but inferior to, Eventlet.
 Bluelet can also be thought of as a less-terrible replacement for
@@ -5,6 +7,9 @@ asyncore.

 Bluelet: easy concurrency without all the messy parallelism.
 """
+from __future__ import division, absolute_import, print_function
+
+import six
 import socket
 import select
 import sys
@@ -15,20 +20,6 @@ import time
 import collections


-# A little bit of "six" (Python 2/3 compatibility): cope with PEP 3109 syntax
-# changes.
-
-PY3 = sys.version_info[0] == 3
-if PY3:
-    def _reraise(typ, exc, tb):
-        raise exc.with_traceback(tb)
-else:
-    exec("""
-def _reraise(typ, exc, tb):
-    raise typ, exc, tb
-""")
-
-
 # Basic events used for thread scheduling.

 class Event(object):
@@ -210,7 +201,7 @@ class ThreadException(Exception):
        self.exc_info = exc_info

    def reraise(self):
-        _reraise(self.exc_info[0], self.exc_info[1], self.exc_info[2])
+        six.reraise(self.exc_info[0], self.exc_info[1], self.exc_info[2])


 SUSPENDED = Event()  # Special sentinel placeholder for suspended threads.
@@ -550,7 +541,7 @@ def spawn(coro):
    and child coroutines run concurrently.
    """
    if not isinstance(coro, types.GeneratorType):
-        raise ValueError('%s is not a coroutine' % str(coro))
+        raise ValueError(u'%s is not a coroutine' % coro)
    return SpawnEvent(coro)


@@ -560,7 +551,7 @@ def call(coro):
    returns a value using end(), then this event returns that value.
    """
    if not isinstance(coro, types.GeneratorType):
-        raise ValueError('%s is not a coroutine' % str(coro))
+        raise ValueError(u'%s is not a coroutine' % coro)
    return DelegationEvent(coro)


@@ -1,5 +1,6 @@
-# This file is part of Confit.
-# Copyright 2014, Adrian Sampson.
+# -*- coding: utf-8 -*-
+# This file is part of Confuse.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -14,19 +15,16 @@

 """Worry-free YAML configuration files.
 """
-from __future__ import unicode_literals
+from __future__ import division, absolute_import, print_function
+
 import platform
 import os
 import pkgutil
 import sys
 import yaml
-import types
 import collections
 import re
-try:
-    from collections import OrderedDict
-except ImportError:
-    from ordereddict import OrderedDict
+from collections import OrderedDict

 UNIX_DIR_VAR = 'XDG_CONFIG_HOME'
 UNIX_DIR_FALLBACK = '~/.config'
@@ -40,14 +38,15 @@ ROOT_NAME = 'root'

 YAML_TAB_PROBLEM = "found character '\\t' that cannot start any token"

+REDACTED_TOMBSTONE = 'REDACTED'
+

 # Utilities.

 PY3 = sys.version_info[0] == 3
-STRING = str if PY3 else unicode
-BASESTRING = str if PY3 else basestring
-NUMERIC_TYPES = (int, float) if PY3 else (int, float, long)
-TYPE_TYPES = (type,) if PY3 else (type, types.ClassType)
+STRING = str if PY3 else unicode  # noqa: F821
+BASESTRING = str if PY3 else basestring  # noqa: F821
+NUMERIC_TYPES = (int, float) if PY3 else (int, float, long)  # noqa: F821


 def iter_first(sequence):
@@ -56,10 +55,7 @@ def iter_first(sequence):
    """
    it = iter(sequence)
    try:
-        if PY3:
-            return next(it)
-        else:
-            return it.next()
+        return next(it)
    except StopIteration:
        raise ValueError()

@@ -96,17 +92,17 @@ class ConfigReadError(ConfigError):
        self.filename = filename
        self.reason = reason

-        message = 'file {0} could not be read'.format(filename)
+        message = u'file {0} could not be read'.format(filename)
        if isinstance(reason, yaml.scanner.ScannerError) and \
                reason.problem == YAML_TAB_PROBLEM:
            # Special-case error message for tab indentation in YAML markup.
-            message += ': found tab character at line {0}, column {1}'.format(
+            message += u': found tab character at line {0}, column {1}'.format(
                reason.problem_mark.line + 1,
                reason.problem_mark.column + 1,
            )
        elif reason:
            # Generic error message uses exception's message.
-            message += ': {0}'.format(reason)
+            message += u': {0}'.format(reason)

        super(ConfigReadError, self).__init__(message)

@@ -120,19 +116,19 @@ class ConfigSource(dict):
    def __init__(self, value, filename=None, default=False):
        super(ConfigSource, self).__init__(value)
        if filename is not None and not isinstance(filename, BASESTRING):
-            raise TypeError('filename must be a string or None')
+            raise TypeError(u'filename must be a string or None')
        self.filename = filename
        self.default = default

    def __repr__(self):
-        return 'ConfigSource({0}, {1}, {2})'.format(
-            super(ConfigSource, self).__repr__(),
-            repr(self.filename),
-            repr(self.default)
+        return 'ConfigSource({0!r}, {1!r}, {2!r})'.format(
+            super(ConfigSource, self),
+            self.filename,
+            self.default,
        )

    @classmethod
-    def of(self, value):
+    def of(cls, value):
        """Given either a dictionary or a `ConfigSource` object, return
        a `ConfigSource` object. This lets a function accept either type
        of object as an argument.
@@ -142,7 +138,7 @@ class ConfigSource(dict):
        elif isinstance(value, dict):
            return ConfigSource(value)
        else:
-            raise TypeError('source value must be a dict')
+            raise TypeError(u'source value must be a dict')


 class ConfigView(object):
@@ -177,7 +173,7 @@ class ConfigView(object):
        try:
            return iter_first(pairs)
        except ValueError:
-            raise NotFoundError("{0} not found".format(self.name))
+            raise NotFoundError(u"{0} not found".format(self.name))

    def exists(self):
        """Determine whether the view has a setting in any source.
@@ -208,7 +204,31 @@ class ConfigView(object):
        raise NotImplementedError

    def __repr__(self):
-        return '<ConfigView: %s>' % self.name
+        return '<{}: {}>'.format(self.__class__.__name__, self.name)
+
+    def __iter__(self):
+        """Iterate over the keys of a dictionary view or the *subviews*
+        of a list view.
+        """
+        # Try getting the keys, if this is a dictionary view.
+        try:
+            keys = self.keys()
+            for key in keys:
+                yield key
+
+        except ConfigTypeError:
+            # Otherwise, try iterating over a list.
+            collection = self.get()
+            if not isinstance(collection, (list, tuple)):
+                raise ConfigTypeError(
+                    u'{0} must be a dictionary or a list, not {1}'.format(
+                        self.name, type(collection).__name__
+                    )
+                )
+
+            # Yield all the indices in the list.
+            for index in range(len(collection)):
+                yield self[index]

    def __getitem__(self, key):
        """Get a subview of this view."""
@@ -225,10 +245,15 @@ class ConfigView(object):

    def set_args(self, namespace):
        """Overlay parsed command-line arguments, generated by a library
-        like argparse or optparse, onto this view's value.
+        like argparse or optparse, onto this view's value. ``namespace``
+        can be a ``dict`` or namespace object.
        """
        args = {}
-        for key, value in namespace.__dict__.items():
+        if isinstance(namespace, dict):
+            items = namespace.items()
+        else:
+            items = namespace.__dict__.items()
+        for key, value in items:
            if value is not None:  # Avoid unset options.
                args[key] = value
        self.set(args)
@@ -239,14 +264,17 @@ class ConfigView(object):
    # just say ``bool(view)`` or use ``view`` in a conditional.

    def __str__(self):
-        """Gets the value for this view as a byte string."""
-        return str(self.get())
+        """Get the value for this view as a bytestring.
+        """
+        if PY3:
+            return self.__unicode__()
+        else:
+            return bytes(self.get())

    def __unicode__(self):
-        """Gets the value for this view as a unicode string. (Python 2
-        only.)
+        """Get the value for this view as a Unicode string.
        """
-        return unicode(self.get())
+        return STRING(self.get())

    def __nonzero__(self):
        """Gets the value for this view as a boolean. (Python 2 only.)
@@ -276,7 +304,7 @@ class ConfigView(object):
                cur_keys = dic.keys()
            except AttributeError:
                raise ConfigTypeError(
-                    '{0} must be a dict, not {1}'.format(
+                    u'{0} must be a dict, not {1}'.format(
                        self.name, type(dic).__name__
                    )
                )
@@ -317,7 +345,7 @@ class ConfigView(object):
                it = iter(collection)
            except TypeError:
                raise ConfigTypeError(
-                    '{0} must be an iterable, not {1}'.format(
+                    u'{0} must be an iterable, not {1}'.format(
                        self.name, type(collection).__name__
                    )
                )
@@ -326,17 +354,23 @@ class ConfigView(object):

    # Validation and conversion.

-    def flatten(self):
+    def flatten(self, redact=False):
        """Create a hierarchy of OrderedDicts containing the data from
        this view, recursively reifying all views to get their
        represented values.
+
+        If `redact` is set, then sensitive values are replaced with
+        the string "REDACTED".
        """
        od = OrderedDict()
        for key, view in self.items():
-            try:
-                od[key] = view.flatten()
-            except ConfigTypeError:
-                od[key] = view.get()
+            if redact and view.redact:
+                od[key] = REDACTED_TOMBSTONE
+            else:
+                try:
+                    od[key] = view.flatten(redact=redact)
+                except ConfigTypeError:
+                    od[key] = view.get()
        return od

    def get(self, template=None):
@@ -354,19 +388,60 @@ class ConfigView(object):
        """
        return as_template(template).value(self, template)

-    # Old validation methods (deprecated).
+    # Shortcuts for common templates.

    def as_filename(self):
+        """Get the value as a path. Equivalent to `get(Filename())`.
+        """
        return self.get(Filename())

    def as_choice(self, choices):
+        """Get the value from a list of choices. Equivalent to
+        `get(Choice(choices))`.
+        """
        return self.get(Choice(choices))

    def as_number(self):
+        """Get the value as any number type: int or float. Equivalent to
+        `get(Number())`.
+        """
        return self.get(Number())

-    def as_str_seq(self):
-        return self.get(StrSeq())
+    def as_str_seq(self, split=True):
+        """Get the value as a sequence of strings. Equivalent to
+        `get(StrSeq())`.
+        """
+        return self.get(StrSeq(split=split))
+
+    def as_str(self):
+        """Get the value as a (Unicode) string. Equivalent to
+        `get(unicode)` on Python 2 and `get(str)` on Python 3.
+        """
+        return self.get(String())
+
+    # Redaction.
+
+    @property
+    def redact(self):
+        """Whether the view contains sensitive information and should be
+        redacted from output.
+        """
+        return () in self.get_redactions()
+
+    @redact.setter
+    def redact(self, flag):
+        self.set_redaction((), flag)
+
+    def set_redaction(self, path, flag):
+        """Add or remove a redaction for a key path, which should be an
+        iterable of keys.
+        """
+        raise NotImplementedError()
+
+    def get_redactions(self):
+        """Get the set of currently-redacted sub-key-paths at this view.
+        """
+        raise NotImplementedError()


 class RootView(ConfigView):
@@ -380,6 +455,7 @@ class RootView(ConfigView):
        """
        self.sources = list(sources)
        self.name = ROOT_NAME
+        self.redactions = set()

    def add(self, obj):
        self.sources.append(ConfigSource.of(obj))
@@ -391,12 +467,24 @@ class RootView(ConfigView):
        return ((dict(s), s) for s in self.sources)

    def clear(self):
-        """Remove all sources from this configuration."""
+        """Remove all sources (and redactions) from this
+        configuration.
+        """
        del self.sources[:]
+        self.redactions.clear()

    def root(self):
        return self

+    def set_redaction(self, path, flag):
+        if flag:
+            self.redactions.add(path)
+        elif path in self.redactions:
+            self.redactions.remove(path)
+
+    def get_redactions(self):
+        return self.redactions
+

 class Subview(ConfigView):
    """A subview accessed via a subscript of a parent view."""
@@ -414,11 +502,13 @@ class Subview(ConfigView):
            if not isinstance(self.key, int):
                self.name += '.'
        if isinstance(self.key, int):
-            self.name += '#{0}'.format(self.key)
-        elif isinstance(self.key, BASESTRING):
-            self.name += '{0}'.format(self.key)
+            self.name += u'#{0}'.format(self.key)
+        elif isinstance(self.key, bytes):
+            self.name += self.key.decode('utf-8')
+        elif isinstance(self.key, STRING):
+            self.name += self.key
        else:
-            self.name += '{0}'.format(repr(self.key))
+            self.name += repr(self.key)

    def resolve(self):
        for collection, source in self.parent.resolve():
@@ -433,7 +523,7 @@ class Subview(ConfigView):
            except TypeError:
                # Not subscriptable.
                raise ConfigTypeError(
-                    "{0} must be a collection, not {1}".format(
+                    u"{0} must be a collection, not {1}".format(
                        self.parent.name, type(collection).__name__
                    )
                )
@@ -448,6 +538,13 @@ class Subview(ConfigView):
    def root(self):
        return self.parent.root()

+    def set_redaction(self, path, flag):
+        self.parent.set_redaction((self.key,) + path, flag)
+
+    def get_redactions(self):
+        return (kp[1:] for kp in self.parent.get_redactions()
+                if kp and kp[0] == self.key)
+

 # Config file paths, including platform-specific paths and in-package
 # defaults.
@@ -536,7 +633,7 @@ class Loader(yaml.SafeLoader):
        else:
            raise yaml.constructor.ConstructorError(
                None, None,
-                'expected a mapping node, but found %s' % node.id,
+                u'expected a mapping node, but found %s' % node.id,
                node.start_mark
            )

@@ -547,7 +644,7 @@ class Loader(yaml.SafeLoader):
                hash(key)
            except TypeError as exc:
                raise yaml.constructor.ConstructorError(
-                    'while constructing a mapping',
+                    u'while constructing a mapping',
                    node.start_mark, 'found unacceptable key (%s)' % exc,
                    key_node.start_mark
                )
@@ -595,11 +692,11 @@ class Dumper(yaml.SafeDumper):
        for item_key, item_value in mapping:
            node_key = self.represent_data(item_key)
            node_value = self.represent_data(item_value)
-            if not (isinstance(node_key, yaml.ScalarNode)
-                    and not node_key.style):
+            if not (isinstance(node_key, yaml.ScalarNode) and
+                    not node_key.style):
                best_style = False
-            if not (isinstance(node_value, yaml.ScalarNode)
-                    and not node_value.style):
+            if not (isinstance(node_value, yaml.ScalarNode) and
+                    not node_value.style):
                best_style = False
            value.append((node_key, node_value))
        if flow_style is None:
@@ -625,9 +722,9 @@ class Dumper(yaml.SafeDumper):
        """Represent bool as 'yes' or 'no' instead of 'true' or 'false'.
        """
        if data:
-            value = 'yes'
+            value = u'yes'
        else:
-            value = 'no'
+            value = u'no'
        return self.represent_scalar('tag:yaml.org,2002:bool', value)

    def represent_none(self, data):
@@ -752,7 +849,7 @@ class Configuration(RootView):
            appdir = os.environ[self._env_var]
            appdir = os.path.abspath(os.path.expanduser(appdir))
            if os.path.isfile(appdir):
-                raise ConfigError('{0} must be a directory'.format(
+                raise ConfigError(u'{0} must be a directory'.format(
                    self._env_var
                ))

@@ -776,7 +873,7 @@ class Configuration(RootView):
        filename = os.path.abspath(filename)
        self.set(ConfigSource(load_yaml(filename), filename))

-    def dump(self, full=True):
+    def dump(self, full=True, redact=False):
        """Dump the Configuration object to a YAML file.

        The order of the keys is determined from the default
@@ -788,13 +885,17 @@ class Configuration(RootView):
        :type filename:   unicode
        :param full:      Dump settings that don't differ from the defaults
                          as well
+        :param redact:    Remove sensitive information (views with the `redact`
+                          flag set) from the output
        """
        if full:
-            out_dict = self.flatten()
+            out_dict = self.flatten(redact=redact)
        else:
            # Exclude defaults when flattening.
            sources = [s for s in self.sources if not s.default]
-            out_dict = RootView(sources).flatten()
+            temp_root = RootView(sources)
+            temp_root.redactions = self.redactions
+            out_dict = temp_root.flatten(redact=redact)

        yaml_out = yaml.dump(out_dict, Dumper=Dumper,
                             default_flow_style=None, indent=4,
@@ -806,7 +907,7 @@ class Configuration(RootView):
            if source.default:
                default_source = source
                break
-        if default_source:
+        if default_source and default_source.filename:
            with open(default_source.filename, 'r') as fp:
                default_data = fp.read()
            yaml_out = restore_yaml_comments(yaml_out, default_data)
@@ -853,7 +954,7 @@ class LazyConfig(Configuration):

    def clear(self):
        """Remove all sources from this configuration."""
-        del self.sources[:]
+        super(LazyConfig, self).clear()
        self._lazy_suffix = []
        self._lazy_prefix = []

@@ -870,7 +971,7 @@ should be raised when the value is missing.
 class Template(object):
    """A value template for configuration fields.

-    The template works like a type and instructs Confit about how to
+    The template works like a type and instructs Confuse about how to
    interpret a deserialized YAML value. This includes type conversions,
    providing a default value, and validating for errors. For example, a
    filepath type might expand tildes and check that the file exists.
@@ -901,7 +1002,7 @@ class Template(object):
            return self.convert(value, view)
        elif self.default is REQUIRED:
            # Missing required value. This is an error.
-            raise NotFoundError("{0} not found".format(view.name))
+            raise NotFoundError(u"{0} not found".format(view.name))
        else:
            # Missing value, but not required.
            return self.default
@@ -926,7 +1027,7 @@ class Template(object):
        """
        exc_class = ConfigTypeError if type_error else ConfigValueError
        raise exc_class(
-            '{0}: {1}'.format(view.name, message)
+            u'{0}: {1}'.format(view.name, message)
        )

    def __repr__(self):
@@ -947,7 +1048,7 @@ class Integer(Template):
        elif isinstance(value, float):
            return int(value)
        else:
-            self.fail('must be a number', view, True)
+            self.fail(u'must be a number', view, True)


 class Number(Template):
@@ -960,7 +1061,7 @@ class Number(Template):
            return value
        else:
            self.fail(
-                'must be numeric, not {0}'.format(type(value).__name__),
+                u'must be numeric, not {0}'.format(type(value).__name__),
                view,
                True
            )
@@ -1005,18 +1106,29 @@ class String(Template):
        if pattern:
            self.regex = re.compile(pattern)

+    def __repr__(self):
+        args = []
+
+        if self.default is not REQUIRED:
+            args.append(repr(self.default))
+
+        if self.pattern is not None:
+            args.append('pattern=' + repr(self.pattern))
+
+        return 'String({0})'.format(', '.join(args))
+
    def convert(self, value, view):
        """Check that the value is a string and matches the pattern.
        """
        if isinstance(value, BASESTRING):
            if self.pattern and not self.regex.match(value):
                self.fail(
-                    "must match the pattern {0}".format(self.pattern),
+                    u"must match the pattern {0}".format(self.pattern),
                    view
                )
            return value
        else:
-            self.fail('must be a string', view, True)
+            self.fail(u'must be a string', view, True)


 class Choice(Template):
@@ -1037,7 +1149,7 @@ class Choice(Template):
        """
        if value not in self.choices:
            self.fail(
-                'must be one of {0}, not {1}'.format(
+                u'must be one of {0}, not {1}'.format(
                    repr(list(self.choices)), repr(value)
                ),
                view
@@ -1052,6 +1164,67 @@ class Choice(Template):
        return 'Choice({0!r})'.format(self.choices)


+class OneOf(Template):
+    """A template that permits values complying to one of the given templates.
+    """
+    def __init__(self, allowed, default=REQUIRED):
+        super(OneOf, self).__init__(default)
+        self.allowed = list(allowed)
+
+    def __repr__(self):
+        args = []
+
+        if self.allowed is not None:
+            args.append('allowed=' + repr(self.allowed))
+
+        if self.default is not REQUIRED:
+            args.append(repr(self.default))
+
+        return 'OneOf({0})'.format(', '.join(args))
+
+    def value(self, view, template):
+        self.template = template
+        return super(OneOf, self).value(view, template)
+
+    def convert(self, value, view):
+        """Ensure that the value follows at least one template.
+        """
+        is_mapping = isinstance(self.template, MappingTemplate)
+
+        for candidate in self.allowed:
+            try:
+                if is_mapping:
+                    if isinstance(candidate, Filename) and \
+                            candidate.relative_to:
+                        next_template = candidate.template_with_relatives(
+                            view,
+                            self.template
+                        )
+
+                        next_template.subtemplates[view.key] = as_template(
+                            candidate
+                        )
+                    else:
+                        next_template = MappingTemplate({view.key: candidate})
+
+                    return view.parent.get(next_template)[view.key]
+                else:
+                    return view.get(candidate)
+            except ConfigTemplateError:
+                raise
+            except ConfigError:
+                pass
+            except ValueError as exc:
+                raise ConfigTemplateError(exc)
+
+        self.fail(
+            u'must be one of {0}, not {1}'.format(
+                repr(self.allowed), repr(value)
+            ),
+            view
+        )
+
+
 class StrSeq(Template):
    """A template for values that are lists of strings.

@@ -1070,7 +1243,7 @@ class StrSeq(Template):

    def convert(self, value, view):
        if isinstance(value, bytes):
-            value = value.decode('utf8', 'ignore')
+            value = value.decode('utf-8', 'ignore')

        if isinstance(value, STRING):
            if self.split:
@@ -1081,17 +1254,17 @@ class StrSeq(Template):
        try:
            value = list(value)
        except TypeError:
-            self.fail('must be a whitespace-separated string or a list',
+            self.fail(u'must be a whitespace-separated string or a list',
                      view, True)

        def convert(x):
-            if isinstance(x, unicode):
+            if isinstance(x, STRING):
                return x
-            elif isinstance(x, BASESTRING):
-                return x.decode('utf8', 'ignore')
+            elif isinstance(x, bytes):
+                return x.decode('utf-8', 'ignore')
            else:
-                self.fail('must be a list of strings', view, True)
-        return map(convert, value)
+                self.fail(u'must be a list of strings', view, True)
+        return list(map(convert, value))


 class Filename(Template):
@@ -1107,7 +1280,7 @@ class Filename(Template):
    """
    def __init__(self, default=REQUIRED, cwd=None, relative_to=None,
                 in_app_dir=False):
-        """ `relative_to` is the name of a sibling value that is
+        """`relative_to` is the name of a sibling value that is
        being validated at the same time.

        `in_app_dir` indicates whether the path should be resolved
@@ -1140,19 +1313,19 @@ class Filename(Template):
        if not isinstance(template, (collections.Mapping, MappingTemplate)):
            # disallow config.get(Filename(relative_to='foo'))
            raise ConfigTemplateError(
-                'relative_to may only be used when getting multiple values.'
+                u'relative_to may only be used when getting multiple values.'
            )

        elif self.relative_to == view.key:
            raise ConfigTemplateError(
-                '{0} is relative to itself'.format(view.name)
+                u'{0} is relative to itself'.format(view.name)
            )

        elif self.relative_to not in view.parent.keys():
            # self.relative_to is not in the config
            self.fail(
                (
-                    'needs sibling value "{0}" to expand relative path'
+                    u'needs sibling value "{0}" to expand relative path'
                ).format(self.relative_to),
                view
            )
@@ -1174,12 +1347,12 @@ class Filename(Template):
                if next_relative in template.subtemplates:
                    # we encountered this config key previously
                    raise ConfigTemplateError((
-                        '{0} and {1} are recursively relative'
+                        u'{0} and {1} are recursively relative'
                    ).format(view.name, self.relative_to))
                else:
                    raise ConfigTemplateError((
-                        'missing template for {0}, needed to expand {1}\'s' +
-                        'relative path'
+                        u'missing template for {0}, needed to expand {1}\'s' +
+                        u'relative path'
                    ).format(self.relative_to, view.name))

            next_template.subtemplates[next_relative] = rel_to_template
@@ -1191,7 +1364,7 @@ class Filename(Template):
        path, source = view.first()
        if not isinstance(path, BASESTRING):
            self.fail(
-                'must be a filename, not {0}'.format(type(path).__name__),
+                u'must be a filename, not {0}'.format(type(path).__name__),
                view,
                True
            )
@@ -1229,7 +1402,7 @@ class TypeTemplate(Template):
    def convert(self, value, view):
        if not isinstance(value, self.typ):
            self.fail(
-                'must be a {0}, not {1}'.format(
+                u'must be a {0}, not {1}'.format(
                    self.typ.__name__,
                    type(value).__name__,
                ),
@@ -1267,6 +1440,11 @@ def as_template(value):
        return String()
    elif isinstance(value, BASESTRING):
        return String(value)
+    elif isinstance(value, set):
+        # convert to list to avoid hash related problems
+        return Choice(list(value))
+    elif isinstance(value, list):
+        return OneOf(value)
    elif value is float:
        return Number()
    elif value is None:
@@ -1278,4 +1456,4 @@ def as_template(value):
    elif isinstance(value, type):
        return TypeTemplate(value)
    else:
-        raise ValueError('cannot convert to template: {0!r}'.format(value))
+        raise ValueError(u'cannot convert to template: {0!r}'.format(value))
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2013, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -12,6 +13,8 @@
 # The above copyright notice and this permission notice shall be
 # included in all copies or substantial portions of the Software.

+from __future__ import division, absolute_import, print_function
+
 from enum import Enum


@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2013, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -25,12 +26,15 @@ library: unknown symbols are left intact.
 This is sort of like a tiny, horrible degeneration of a real templating
 engine like Jinja2 or Mustache.
 """
-from __future__ import print_function
+
+from __future__ import division, absolute_import, print_function

 import re
 import ast
 import dis
 import types
+import sys
+import six

 SYMBOL_DELIM = u'$'
 FUNC_DELIM = u'%'
@@ -70,13 +74,13 @@ def ex_literal(val):
    """
    if val is None:
        return ast.Name('None', ast.Load())
-    elif isinstance(val, (int, float, long)):
+    elif isinstance(val, six.integer_types):
        return ast.Num(val)
    elif isinstance(val, bool):
-        return ast.Name(str(val), ast.Load())
-    elif isinstance(val, basestring):
+        return ast.Name(bytes(val), ast.Load())
+    elif isinstance(val, six.string_types):
        return ast.Str(val)
-    raise TypeError('no literal for {0}'.format(type(val)))
+    raise TypeError(u'no literal for {0}'.format(type(val)))


 def ex_varassign(name, expr):
@@ -93,7 +97,7 @@ def ex_call(func, args):
    function may be an expression or the name of a function. Each
    argument may be an expression or a value to be used as a literal.
    """
-    if isinstance(func, basestring):
+    if isinstance(func, six.string_types):
        func = ex_rvalue(func)

    args = list(args)
@@ -101,7 +105,10 @@ def ex_call(func, args):
        if not isinstance(args[i], ast.expr):
            args[i] = ex_literal(args[i])

-    return ast.Call(func, args, [], None, None)
+    if sys.version_info[:2] < (3, 5):
+        return ast.Call(func, args, [], None, None)
+    else:
+        return ast.Call(func, args, [])


 def compile_func(arg_names, statements, name='_the_func', debug=False):
@@ -109,16 +116,31 @@ def compile_func(arg_names, statements, name='_the_func', debug=False):
    the resulting Python function. If `debug`, then print out the
    bytecode of the compiled function.
    """
-    func_def = ast.FunctionDef(
-        name,
-        ast.arguments(
-            [ast.Name(n, ast.Param()) for n in arg_names],
-            None, None,
-            [ex_literal(None) for _ in arg_names],
-        ),
-        statements,
-        [],
-    )
+    if six.PY2:
+        func_def = ast.FunctionDef(
+            name=name.encode('utf-8'),
+            args=ast.arguments(
+                args=[ast.Name(n, ast.Param()) for n in arg_names],
+                vararg=None,
+                kwarg=None,
+                defaults=[ex_literal(None) for _ in arg_names],
+            ),
+            body=statements,
+            decorator_list=[],
+        )
+    else:
+        func_def = ast.FunctionDef(
+            name=name,
+            args=ast.arguments(
+                args=[ast.arg(arg=n, annotation=None) for n in arg_names],
+                kwonlyargs=[],
+                kw_defaults=[],
+                defaults=[ex_literal(None) for _ in arg_names],
+            ),
+            body=statements,
+            decorator_list=[],
+        )
+
    mod = ast.Module([func_def])
    ast.fix_missing_locations(mod)

@@ -132,7 +154,7 @@ def compile_func(arg_names, statements, name='_the_func', debug=False):
                dis.dis(const)

    the_locals = {}
-    exec prog in {}, the_locals
+    exec(prog, {}, the_locals)
    return the_locals[name]


@@ -160,8 +182,12 @@ class Symbol(object):

    def translate(self):
        """Compile the variable lookup."""
-        expr = ex_rvalue(VARIABLE_PREFIX + self.ident.encode('utf8'))
-        return [expr], set([self.ident.encode('utf8')]), set()
+        if six.PY2:
+            ident = self.ident.encode('utf-8')
+        else:
+            ident = self.ident
+        expr = ex_rvalue(VARIABLE_PREFIX + ident)
+        return [expr], set([ident]), set()


 class Call(object):
@@ -186,15 +212,19 @@ class Call(object):
            except Exception as exc:
                # Function raised exception! Maybe inlining the name of
                # the exception will help debug.
-                return u'<%s>' % unicode(exc)
-            return unicode(out)
+                return u'<%s>' % six.text_type(exc)
+            return six.text_type(out)
        else:
            return self.original

    def translate(self):
        """Compile the function call."""
        varnames = set()
-        funcnames = set([self.ident.encode('utf8')])
+        if six.PY2:
+            ident = self.ident.encode('utf-8')
+        else:
+            ident = self.ident
+        funcnames = set([ident])

        arg_exprs = []
        for arg in self.args:
@@ -209,14 +239,14 @@ class Call(object):
                [ex_call(
                    'map',
                    [
-                        ex_rvalue('unicode'),
+                        ex_rvalue(six.text_type.__name__),
                        ast.List(subexprs, ast.Load()),
                    ]
                )],
            ))

        subexpr_call = ex_call(
-            FUNCTION_PREFIX + self.ident.encode('utf8'),
+            FUNCTION_PREFIX + ident,
            arg_exprs
        )
        return [subexpr_call], varnames, funcnames
@@ -238,11 +268,11 @@ class Expression(object):
        """
        out = []
        for part in self.parts:
-            if isinstance(part, basestring):
+            if isinstance(part, six.string_types):
                out.append(part)
            else:
                out.append(part.evaluate(env))
-        return u''.join(map(unicode, out))
+        return u''.join(map(six.text_type, out))

    def translate(self):
        """Compile the expression to a list of Python AST expressions, a
@@ -252,7 +282,7 @@ class Expression(object):
        varnames = set()
        funcnames = set()
        for part in self.parts:
-            if isinstance(part, basestring):
+            if isinstance(part, six.string_types):
                expressions.append(ex_literal(part))
            else:
                e, v, f = part.translate()
@@ -281,16 +311,24 @@ class Parser(object):
    replaced with a real, accepted parsing technique (PEG, parser
    generator, etc.).
    """
-    def __init__(self, string):
+    def __init__(self, string, in_argument=False):
+        """ Create a new parser.
+        :param in_arguments: boolean that indicates the parser is to be
+        used for parsing function arguments, ie. considering commas
+        (`ARG_SEP`) a special character
+        """
        self.string = string
+        self.in_argument = in_argument
        self.pos = 0
        self.parts = []

    # Common parsing resources.
    special_chars = (SYMBOL_DELIM, FUNC_DELIM, GROUP_OPEN, GROUP_CLOSE,
-                     ARG_SEP, ESCAPE_CHAR)
-    special_char_re = re.compile(ur'[%s]|$' %
+                     ESCAPE_CHAR)
+    special_char_re = re.compile(r'[%s]|$' %
                                 u''.join(re.escape(c) for c in special_chars))
+    escapable_chars = (SYMBOL_DELIM, FUNC_DELIM, GROUP_CLOSE, ARG_SEP)
+    terminator_chars = (GROUP_CLOSE,)

    def parse_expression(self):
        """Parse a template expression starting at ``pos``. Resulting
@@ -298,17 +336,27 @@ class Parser(object):
        the ``parts`` field, a list.  The ``pos`` field is updated to be
        the next character after the expression.
        """
+        # Append comma (ARG_SEP) to the list of special characters only when
+        # parsing function arguments.
+        extra_special_chars = ()
+        special_char_re = self.special_char_re
+        if self.in_argument:
+            extra_special_chars = (ARG_SEP,)
+            special_char_re = re.compile(
+                r'[%s]|$' % u''.join(re.escape(c) for c in
+                                     self.special_chars + extra_special_chars))
+
        text_parts = []

        while self.pos < len(self.string):
            char = self.string[self.pos]

-            if char not in self.special_chars:
+            if char not in self.special_chars + extra_special_chars:
                # A non-special character. Skip to the next special
                # character, treating the interstice as literal text.
                next_pos = (
-                    self.special_char_re.search(self.string[self.pos:]).start()
-                    + self.pos
+                    special_char_re.search(
+                        self.string[self.pos:]).start() + self.pos
                )
                text_parts.append(self.string[self.pos:next_pos])
                self.pos = next_pos
@@ -318,14 +366,14 @@ class Parser(object):
                # The last character can never begin a structure, so we
                # just interpret it as a literal character (unless it
                # terminates the expression, as with , and }).
-                if char not in (GROUP_CLOSE, ARG_SEP):
+                if char not in self.terminator_chars + extra_special_chars:
                    text_parts.append(char)
                    self.pos += 1
                break

            next_char = self.string[self.pos + 1]
-            if char == ESCAPE_CHAR and next_char in \
-                    (SYMBOL_DELIM, FUNC_DELIM, GROUP_CLOSE, ARG_SEP):
+            if char == ESCAPE_CHAR and next_char in (self.escapable_chars +
+                                                     extra_special_chars):
                # An escaped special character ($$, $}, etc.). Note that
                # ${ is not an escape sequence: this is ambiguous with
                # the start of a symbol and it's not necessary (just
@@ -345,7 +393,7 @@ class Parser(object):
            elif char == FUNC_DELIM:
                # Parse a function call.
                self.parse_call()
-            elif char in (GROUP_CLOSE, ARG_SEP):
+            elif char in self.terminator_chars + extra_special_chars:
                # Template terminated.
                break
            elif char == GROUP_OPEN:
@@ -453,7 +501,7 @@ class Parser(object):
        expressions = []

        while self.pos < len(self.string):
-            subparser = Parser(self.string[self.pos:])
+            subparser = Parser(self.string[self.pos:], in_argument=True)
            subparser.parse_expression()

            # Extract and advance past the parsed expression.
@@ -477,7 +525,7 @@ class Parser(object):
        Updates ``pos``.
        """
        remainder = self.string[self.pos:]
-        ident = re.match(ur'\w*', remainder).group(0)
+        ident = re.match(r'\w*', remainder).group(0)
        self.pos += len(ident)
        return ident

@@ -524,6 +572,7 @@ class Template(object):
            res = self.compiled(values, functions)
        except:  # Handle any exceptions thrown by compiled version.
            res = self.interpret(values, functions)
+
        return res

    def translate(self):
@@ -532,9 +581,9 @@ class Template(object):

        argnames = []
        for varname in varnames:
-            argnames.append(VARIABLE_PREFIX.encode('utf8') + varname)
+            argnames.append(VARIABLE_PREFIX + varname)
        for funcname in funcnames:
-            argnames.append(FUNCTION_PREFIX.encode('utf8') + funcname)
+            argnames.append(FUNCTION_PREFIX + funcname)

        func = compile_func(
            argnames,
@@ -559,7 +608,7 @@ if __name__ == '__main__':
    import timeit
    _tmpl = Template(u'foo $bar %baz{foozle $bar barzle} $bar')
    _vars = {'bar': 'qux'}
-    _funcs = {'baz': unicode.upper}
+    _funcs = {'baz': six.text_type.upper}
    interp_time = timeit.timeit('_tmpl.interpret(_vars, _funcs)',
                                'from __main__ import _tmpl, _vars, _funcs',
                                number=10000)
@@ -568,4 +617,4 @@ if __name__ == '__main__':
                              'from __main__ import _tmpl, _vars, _funcs',
                              number=10000)
    print(comp_time)
-    print('Speedup:', interp_time / comp_time)
+    print(u'Speedup:', interp_time / comp_time)
@@ -0,0 +1,86 @@
+# -*- coding: utf-8 -*-
+# This file is part of beets.
+# Copyright 2016, Adrian Sampson.
+#
+# Permission is hereby granted, free of charge, to any person obtaining
+# a copy of this software and associated documentation files (the
+# "Software"), to deal in the Software without restriction, including
+# without limitation the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the Software, and to
+# permit persons to whom the Software is furnished to do so, subject to
+# the following conditions:
+#
+# The above copyright notice and this permission notice shall be
+# included in all copies or substantial portions of the Software.
+
+"""Simple library to work out if a file is hidden on different platforms."""
+from __future__ import division, absolute_import, print_function
+
+import os
+import stat
+import ctypes
+import sys
+import beets.util
+
+
+def _is_hidden_osx(path):
+    """Return whether or not a file is hidden on OS X.
+
+    This uses os.lstat to work out if a file has the "hidden" flag.
+    """
+    file_stat = os.lstat(beets.util.syspath(path))
+
+    if hasattr(file_stat, 'st_flags') and hasattr(stat, 'UF_HIDDEN'):
+        return bool(file_stat.st_flags & stat.UF_HIDDEN)
+    else:
+        return False
+
+
+def _is_hidden_win(path):
+    """Return whether or not a file is hidden on Windows.
+
+    This uses GetFileAttributes to work out if a file has the "hidden" flag
+    (FILE_ATTRIBUTE_HIDDEN).
+    """
+    # FILE_ATTRIBUTE_HIDDEN = 2 (0x2) from GetFileAttributes documentation.
+    hidden_mask = 2
+
+    # Retrieve the attributes for the file.
+    attrs = ctypes.windll.kernel32.GetFileAttributesW(beets.util.syspath(path))
+
+    # Ensure we have valid attribues and compare them against the mask.
+    return attrs >= 0 and attrs & hidden_mask
+
+
+def _is_hidden_dot(path):
+    """Return whether or not a file starts with a dot.
+
+    Files starting with a dot are seen as "hidden" files on Unix-based OSes.
+    """
+    return os.path.basename(path).startswith(b'.')
+
+
+def is_hidden(path):
+    """Return whether or not a file is hidden. `path` should be a
+    bytestring filename.
+
+    This method works differently depending on the platform it is called on.
+
+    On OS X, it uses both the result of `is_hidden_osx` and `is_hidden_dot` to
+    work out if a file is hidden.
+
+    On Windows, it uses the result of `is_hidden_win` to work out if a file is
+    hidden.
+
+    On any other operating systems (i.e. Linux), it uses `is_hidden_dot` to
+    work out if a file is hidden.
+    """
+    # Run platform specific functions depending on the platform
+    if sys.platform == 'darwin':
+        return _is_hidden_osx(path) or _is_hidden_dot(path)
+    elif sys.platform == 'win32':
+        return _is_hidden_win(path)
+    else:
+        return _is_hidden_dot(path)
+
+__all__ = ['is_hidden']
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2013, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -30,11 +31,13 @@ up a bottleneck stage by dividing its work among multiple threads.
 To do so, pass an iterable of coroutines to the Pipeline constructor
 in place of any single coroutine.
 """
-from __future__ import print_function

-import Queue
+from __future__ import division, absolute_import, print_function
+
+from six.moves import queue
 from threading import Thread, Lock
 import sys
+import six

 BUBBLE = '__PIPELINE_BUBBLE__'
 POISON = '__PIPELINE_POISON__'
@@ -61,7 +64,17 @@ def _invalidate_queue(q, val=None, sync=True):
        q.mutex.acquire()

    try:
-        q.maxsize = 0
+        # Originally, we set `maxsize` to 0 here, which is supposed to mean
+        # an unlimited queue size. However, there is a race condition since
+        # Python 3.2 when this attribute is changed while another thread is
+        # waiting in put()/get() due to a full/empty queue.
+        # Setting it to 2 is still hacky because Python does not give any
+        # guarantee what happens if Queue methods/attributes are overwritten
+        # when it is already in use. However, because of our dummy _put()
+        # and _get() methods, it provides a workaround to let the queue appear
+        # to be never empty or full.
+        # See issue https://github.com/beetbox/beets/issues/2078
+        q.maxsize = 2
        q._qsize = _qsize
        q._put = _put
        q._get = _get
@@ -73,13 +86,13 @@ def _invalidate_queue(q, val=None, sync=True):
            q.mutex.release()


-class CountedQueue(Queue.Queue):
+class CountedQueue(queue.Queue):
    """A queue that keeps track of the number of threads that are
    still feeding into it. The queue is poisoned when all threads are
    finished with the queue.
    """
    def __init__(self, maxsize=0):
-        Queue.Queue.__init__(self, maxsize)
+        queue.Queue.__init__(self, maxsize)
        self.nthreads = 0
        self.poisoned = False

@@ -246,7 +259,7 @@ class FirstPipelineThread(PipelineThread):

                # Get the value from the generator.
                try:
-                    msg = self.coro.next()
+                    msg = next(self.coro)
                except StopIteration:
                    break

@@ -279,7 +292,7 @@ class MiddlePipelineThread(PipelineThread):
    def run(self):
        try:
            # Prime the coroutine.
-            self.coro.next()
+            next(self.coro)

            while True:
                with self.abort_lock:
@@ -324,7 +337,7 @@ class LastPipelineThread(PipelineThread):

    def run(self):
        # Prime the coroutine.
-        self.coro.next()
+        next(self.coro)

        try:
            while True:
@@ -359,7 +372,7 @@ class Pipeline(object):
        be at least two stages.
        """
        if len(stages) < 2:
-            raise ValueError('pipeline must have at least two stages')
+            raise ValueError(u'pipeline must have at least two stages')
        self.stages = []
        for stage in stages:
            if isinstance(stage, (list, tuple)):
@@ -409,7 +422,7 @@ class Pipeline(object):
        try:
            # Using a timeout allows us to receive KeyboardInterrupt
            # exceptions during the join().
-            while threads[-1].isAlive():
+            while threads[-1].is_alive():
                threads[-1].join(1)

        except:
@@ -429,7 +442,7 @@ class Pipeline(object):
            exc_info = thread.exc_info
            if exc_info:
                # Make the exception appear as it was raised originally.
-                raise exc_info[0], exc_info[1], exc_info[2]
+                six.reraise(exc_info[0], exc_info[1], exc_info[2])

    def pull(self):
        """Yield elements from the end of the pipeline. Runs the stages
@@ -442,7 +455,7 @@ class Pipeline(object):

        # "Prime" the coroutines.
        for coro in coros[1:]:
-            coro.next()
+            next(coro)

        # Begin the pipeline.
        for out in coros[0]:
@@ -464,14 +477,14 @@ if __name__ == '__main__':
    # in parallel.
    def produce():
        for i in range(5):
-            print('generating %i' % i)
+            print(u'generating %i' % i)
            time.sleep(1)
            yield i

    def work():
        num = yield
        while True:
-            print('processing %i' % num)
+            print(u'processing %i' % num)
            time.sleep(2)
            num = yield num * 2

@@ -479,7 +492,7 @@ if __name__ == '__main__':
        while True:
            num = yield
            time.sleep(1)
-            print('received %i' % num)
+            print(u'received %i' % num)

    ts_start = time.time()
    Pipeline([produce(), work(), consume()]).run_sequential()
@@ -488,22 +501,22 @@ if __name__ == '__main__':
    ts_par = time.time()
    Pipeline([produce(), (work(), work()), consume()]).run_parallel()
    ts_end = time.time()
-    print('Sequential time:', ts_seq - ts_start)
-    print('Parallel time:', ts_par - ts_seq)
-    print('Multiply-parallel time:', ts_end - ts_par)
+    print(u'Sequential time:', ts_seq - ts_start)
+    print(u'Parallel time:', ts_par - ts_seq)
+    print(u'Multiply-parallel time:', ts_end - ts_par)
    print()

    # Test a pipeline that raises an exception.
    def exc_produce():
        for i in range(10):
-            print('generating %i' % i)
+            print(u'generating %i' % i)
            time.sleep(1)
            yield i

    def exc_work():
        num = yield
        while True:
-            print('processing %i' % num)
+            print(u'processing %i' % num)
            time.sleep(3)
            if num == 3:
                raise Exception()
@@ -512,6 +525,6 @@ if __name__ == '__main__':
    def exc_consume():
        while True:
            num = yield
-            print('received %i' % num)
+            print(u'received %i' % num)

    Pipeline([exc_produce(), exc_work(), exc_consume()]).run_parallel(1)
@@ -1,5 +1,6 @@
+# -*- coding: utf-8 -*-
 # This file is part of beets.
-# Copyright 2013, Adrian Sampson.
+# Copyright 2016, Adrian Sampson.
 #
 # Permission is hereby granted, free of charge, to any person obtaining
 # a copy of this software and associated documentation files (the
@@ -15,6 +16,8 @@
 """A simple utility for constructing filesystem-like trees from beets
 libraries.
 """
+from __future__ import division, absolute_import, print_function
+
 from collections import namedtuple
 from beets import util

@@ -0,0 +1,4 @@
+try:
+    from .cjellyfish import *   # noqa
+except ImportError:
+    from ._jellyfish import *   # noqa
@@ -0,0 +1,488 @@
+import unicodedata
+from collections import defaultdict
+from .compat import _range, _zip_longest, _no_bytes_err
+from .porter import Stemmer
+
+
+def _normalize(s):
+    return unicodedata.normalize('NFKD', s)
+
+
+def levenshtein_distance(s1, s2):
+    if isinstance(s1, bytes) or isinstance(s2, bytes):
+        raise TypeError(_no_bytes_err)
+
+    if s1 == s2:
+        return 0
+    rows = len(s1)+1
+    cols = len(s2)+1
+
+    if not s1:
+        return cols-1
+    if not s2:
+        return rows-1
+
+    prev = None
+    cur = range(cols)
+    for r in _range(1, rows):
+        prev, cur = cur, [r] + [0]*(cols-1)
+        for c in _range(1, cols):
+            deletion = prev[c] + 1
+            insertion = cur[c-1] + 1
+            edit = prev[c-1] + (0 if s1[r-1] == s2[c-1] else 1)
+            cur[c] = min(edit, deletion, insertion)
+
+    return cur[-1]
+
+
+def _jaro_winkler(ying, yang, long_tolerance, winklerize):
+    if isinstance(ying, bytes) or isinstance(yang, bytes):
+        raise TypeError(_no_bytes_err)
+
+    ying_len = len(ying)
+    yang_len = len(yang)
+
+    if not ying_len or not yang_len:
+        return 0
+
+    min_len = max(ying_len, yang_len)
+    search_range = (min_len // 2) - 1
+    if search_range < 0:
+        search_range = 0
+
+    ying_flags = [False]*ying_len
+    yang_flags = [False]*yang_len
+
+    # looking only within search range, count & flag matched pairs
+    common_chars = 0
+    for i, ying_ch in enumerate(ying):
+        low = i - search_range if i > search_range else 0
+        hi = i + search_range if i + search_range < yang_len else yang_len - 1
+        for j in _range(low, hi+1):
+            if not yang_flags[j] and yang[j] == ying_ch:
+                ying_flags[i] = yang_flags[j] = True
+                common_chars += 1
+                break
+
+    # short circuit if no characters match
+    if not common_chars:
+        return 0
+
+    # count transpositions
+    k = trans_count = 0
+    for i, ying_f in enumerate(ying_flags):
+        if ying_f:
+            for j in _range(k, yang_len):
+                if yang_flags[j]:
+                    k = j + 1
+                    break
+            if ying[i] != yang[j]:
+                trans_count += 1
+    trans_count /= 2
+
+    # adjust for similarities in nonmatched characters
+    common_chars = float(common_chars)
+    weight = ((common_chars/ying_len + common_chars/yang_len +
+              (common_chars-trans_count) / common_chars)) / 3
+
+    # winkler modification: continue to boost if strings are similar
+    if winklerize and weight > 0.7 and ying_len > 3 and yang_len > 3:
+        # adjust for up to first 4 chars in common
+        j = min(min_len, 4)
+        i = 0
+        while i < j and ying[i] == yang[i] and ying[i]:
+            i += 1
+        if i:
+            weight += i * 0.1 * (1.0 - weight)
+
+        # optionally adjust for long strings
+        # after agreeing beginning chars, at least two or more must agree and
+        # agreed characters must be > half of remaining characters
+        if (long_tolerance and min_len > 4 and common_chars > i+1 and
+                2 * common_chars >= min_len + i):
+            weight += ((1.0 - weight) * (float(common_chars-i-1) / float(ying_len+yang_len-i*2+2)))
+
+    return weight
+
+
+def damerau_levenshtein_distance(s1, s2):
+    if isinstance(s1, bytes) or isinstance(s2, bytes):
+        raise TypeError(_no_bytes_err)
+
+    len1 = len(s1)
+    len2 = len(s2)
+    infinite = len1 + len2
+
+    # character array
+    da = defaultdict(int)
+
+    # distance matrix
+    score = [[0]*(len2+2) for x in _range(len1+2)]
+
+    score[0][0] = infinite
+    for i in _range(0, len1+1):
+        score[i+1][0] = infinite
+        score[i+1][1] = i
+    for i in _range(0, len2+1):
+        score[0][i+1] = infinite
+        score[1][i+1] = i
+
+    for i in _range(1, len1+1):
+        db = 0
+        for j in _range(1, len2+1):
+            i1 = da[s2[j-1]]
+            j1 = db
+            cost = 1
+            if s1[i-1] == s2[j-1]:
+                cost = 0
+                db = j
+
+            score[i+1][j+1] = min(score[i][j] + cost,
+                                  score[i+1][j] + 1,
+                                  score[i][j+1] + 1,
+                                  score[i1][j1] + (i-i1-1) + 1 + (j-j1-1))
+        da[s1[i-1]] = i
+
+    return score[len1+1][len2+1]
+
+
+def jaro_distance(s1, s2):
+    return _jaro_winkler(s1, s2, False, False)
+
+
+def jaro_winkler(s1, s2, long_tolerance=False):
+    return _jaro_winkler(s1, s2, long_tolerance, True)
+
+
+def soundex(s):
+    if not s:
+        return s
+    if isinstance(s, bytes):
+        raise TypeError(_no_bytes_err)
+
+    s = _normalize(s)
+
+    replacements = (('bfpv', '1'),
+                    ('cgjkqsxz', '2'),
+                    ('dt', '3'),
+                    ('l', '4'),
+                    ('mn', '5'),
+                    ('r', '6'))
+    result = [s[0]]
+    count = 1
+
+    # find would-be replacment for first character
+    for lset, sub in replacements:
+        if s[0].lower() in lset:
+            last = sub
+            break
+    else:
+        last = None
+
+    for letter in s[1:]:
+        for lset, sub in replacements:
+            if letter.lower() in lset:
+                if sub != last:
+                    result.append(sub)
+                    count += 1
+                last = sub
+                break
+        else:
+            last = None
+        if count == 4:
+            break
+
+    result += '0'*(4-count)
+    return ''.join(result)
+
+
+def hamming_distance(s1, s2):
+    if isinstance(s1, bytes) or isinstance(s2, bytes):
+        raise TypeError(_no_bytes_err)
+
+    # ensure length of s1 >= s2
+    if len(s2) > len(s1):
+        s1, s2 = s2, s1
+
+    # distance is difference in length + differing chars
+    distance = len(s1) - len(s2)
+    for i, c in enumerate(s2):
+        if c != s1[i]:
+            distance += 1
+
+    return distance
+
+
+def nysiis(s):
+    if isinstance(s, bytes):
+        raise TypeError(_no_bytes_err)
+    if not s:
+        return ''
+
+    s = s.upper()
+    key = []
+
+    # step 1 - prefixes
+    if s.startswith('MAC'):
+        s = 'MCC' + s[3:]
+    elif s.startswith('KN'):
+        s = s[1:]
+    elif s.startswith('K'):
+        s = 'C' + s[1:]
+    elif s.startswith(('PH', 'PF')):
+        s = 'FF' + s[2:]
+    elif s.startswith('SCH'):
+        s = 'SSS' + s[3:]
+
+    # step 2 - suffixes
+    if s.endswith(('IE', 'EE')):
+        s = s[:-2] + 'Y'
+    elif s.endswith(('DT', 'RT', 'RD', 'NT', 'ND')):
+        s = s[:-2] + 'D'
+
+    # step 3 - first character of key comes from name
+    key.append(s[0])
+
+    # step 4 - translate remaining chars
+    i = 1
+    len_s = len(s)
+    while i < len_s:
+        ch = s[i]
+        if ch == 'E' and i+1 < len_s and s[i+1] == 'V':
+            ch = 'AF'
+            i += 1
+        elif ch in 'AEIOU':
+            ch = 'A'
+        elif ch == 'Q':
+            ch = 'G'
+        elif ch == 'Z':
+            ch = 'S'
+        elif ch == 'M':
+            ch = 'N'
+        elif ch == 'K':
+            if i+1 < len(s) and s[i+1] == 'N':
+                ch = 'N'
+            else:
+                ch = 'C'
+        elif ch == 'S' and s[i+1:i+3] == 'CH':
+            ch = 'SS'
+            i += 2
+        elif ch == 'P' and i+1 < len(s) and s[i+1] == 'H':
+            ch = 'F'
+            i += 1
+        elif ch == 'H' and (s[i-1] not in 'AEIOU' or (i+1 < len(s) and s[i+1] not in 'AEIOU')):
+            if s[i-1] in 'AEIOU':
+                ch = 'A'
+            else:
+                ch = s[i-1]
+        elif ch == 'W' and s[i-1] in 'AEIOU':
+            ch = s[i-1]
+
+        if ch[-1] != key[-1][-1]:
+            key.append(ch)
+
+        i += 1
+
+    key = ''.join(key)
+
+    # step 5 - remove trailing S
+    if key.endswith('S') and key != 'S':
+        key = key[:-1]
+
+    # step 6 - replace AY w/ Y
+    if key.endswith('AY'):
+        key = key[:-2] + 'Y'
+
+    # step 7 - remove trailing A
+    if key.endswith('A') and key != 'A':
+        key = key[:-1]
+
+    # step 8 was already done
+
+    return key
+
+
+def match_rating_codex(s):
+    if isinstance(s, bytes):
+        raise TypeError(_no_bytes_err)
+    s = s.upper()
+    codex = []
+
+    prev = None
+    for i, c in enumerate(s):
+        # not a space OR
+        # starting character & vowel
+        # or consonant not preceded by same consonant
+        if (c != ' ' and (i == 0 and c in 'AEIOU') or (c not in 'AEIOU' and c != prev)):
+            codex.append(c)
+
+        prev = c
+
+    # just use first/last 3
+    if len(codex) > 6:
+        return ''.join(codex[:3]+codex[-3:])
+    else:
+        return ''.join(codex)
+
+
+def match_rating_comparison(s1, s2):
+    codex1 = match_rating_codex(s1)
+    codex2 = match_rating_codex(s2)
+    len1 = len(codex1)
+    len2 = len(codex2)
+    res1 = []
+    res2 = []
+
+    # length differs by 3 or more, no result
+    if abs(len1-len2) >= 3:
+        return None
+
+    # get minimum rating based on sums of codexes
+    lensum = len1 + len2
+    if lensum <= 4:
+        min_rating = 5
+    elif lensum <= 7:
+        min_rating = 4
+    elif lensum <= 11:
+        min_rating = 3
+    else:
+        min_rating = 2
+
+    # strip off common prefixes
+    for c1, c2 in _zip_longest(codex1, codex2):
+        if c1 != c2:
+            if c1:
+                res1.append(c1)
+            if c2:
+                res2.append(c2)
+
+    unmatched_count1 = unmatched_count2 = 0
+    for c1, c2 in _zip_longest(reversed(res1), reversed(res2)):
+        if c1 != c2:
+            if c1:
+                unmatched_count1 += 1
+            if c2:
+                unmatched_count2 += 1
+
+    return (6 - max(unmatched_count1, unmatched_count2)) >= min_rating
+
+
+def metaphone(s):
+    if isinstance(s, bytes):
+        raise TypeError(_no_bytes_err)
+
+    result = []
+
+    s = _normalize(s.lower())
+
+    # skip first character if s starts with these
+    if s.startswith(('kn', 'gn', 'pn', 'ac', 'wr', 'ae')):
+        s = s[1:]
+
+    i = 0
+
+    while i < len(s):
+        c = s[i]
+        next = s[i+1] if i < len(s)-1 else '*****'
+        nextnext = s[i+2] if i < len(s)-2 else '*****'
+
+        # skip doubles except for cc
+        if c == next and c != 'c':
+            i += 1
+            continue
+
+        if c in 'aeiou':
+            if i == 0 or s[i-1] == ' ':
+                result.append(c)
+        elif c == 'b':
+            if (not (i != 0 and s[i-1] == 'm')) or next:
+                result.append('b')
+        elif c == 'c':
+            if next == 'i' and nextnext == 'a' or next == 'h':
+                result.append('x')
+                i += 1
+            elif next in 'iey':
+                result.append('s')
+                i += 1
+            else:
+                result.append('k')
+        elif c == 'd':
+            if next == 'g' and nextnext in 'iey':
+                result.append('j')
+                i += 2
+            else:
+                result.append('t')
+        elif c in 'fjlmnr':
+            result.append(c)
+        elif c == 'g':
+            if next in 'iey':
+                result.append('j')
+            elif next not in 'hn':
+                result.append('k')
+            elif next == 'h' and nextnext and nextnext not in 'aeiou':
+                i += 1
+        elif c == 'h':
+            if i == 0 or next in 'aeiou' or s[i-1] not in 'aeiou':
+                result.append('h')
+        elif c == 'k':
+            if i == 0 or s[i-1] != 'c':
+                result.append('k')
+        elif c == 'p':
+            if next == 'h':
+                result.append('f')
+                i += 1
+            else:
+                result.append('p')
+        elif c == 'q':
+            result.append('k')
+        elif c == 's':
+            if next == 'h':
+                result.append('x')
+                i += 1
+            elif next == 'i' and nextnext in 'oa':
+                result.append('x')
+                i += 2
+            else:
+                result.append('s')
+        elif c == 't':
+            if next == 'i' and nextnext in 'oa':
+                result.append('x')
+            elif next == 'h':
+                result.append('0')
+                i += 1
+            elif next != 'c' or nextnext != 'h':
+                result.append('t')
+        elif c == 'v':
+            result.append('f')
+        elif c == 'w':
+            if i == 0 and next == 'h':
+                i += 1
+            if nextnext in 'aeiou' or nextnext == '*****':
+                result.append('w')
+        elif c == 'x':
+            if i == 0:
+                if next == 'h' or (next == 'i' and nextnext in 'oa'):
+                    result.append('x')
+                else:
+                    result.append('s')
+            else:
+                result.append('k')
+                result.append('s')
+        elif c == 'y':
+            if next in 'aeiou':
+                result.append('y')
+        elif c == 'z':
+            result.append('s')
+        elif c == ' ':
+            if len(result) > 0 and result[-1] != ' ':
+                result.append(' ')
+
+        i += 1
+
+    return ''.join(result).upper()
+
+
+def porter_stem(s):
+    if isinstance(s, bytes):
+        raise TypeError(_no_bytes_err)
+    return Stemmer(s).stem()
@@ -0,0 +1,13 @@
+import sys
+import itertools
+
+IS_PY3 = sys.version_info[0] == 3
+
+if IS_PY3:
+    _range = range
+    _zip_longest = itertools.zip_longest
+    _no_bytes_err = 'expected str, got bytes'
+else:
+    _range = xrange
+    _zip_longest = itertools.izip_longest
+    _no_bytes_err = 'expected unicode, got str'
@@ -0,0 +1,218 @@
+from .compat import _range
+
+_s2_options = {
+    'a': ((['a', 't', 'i', 'o', 'n', 'a', 'l'], ['a', 't', 'e']),
+          (['t', 'i', 'o', 'n', 'a', 'l'], ['t', 'i', 'o', 'n'])),
+    'c': ((['e', 'n', 'c', 'i'], ['e', 'n', 'c', 'e']),
+          (['a', 'n', 'c', 'i'], ['a', 'n', 'c', 'e']),),
+    'e': ((['i', 'z', 'e', 'r'], ['i', 'z', 'e']),),
+    'l': ((['b', 'l', 'i'], ['b', 'l', 'e']),
+          (['a', 'l', 'l', 'i'], ['a', 'l']),
+          (['e', 'n', 't', 'l', 'i'], ['e', 'n', 't']),
+          (['e', 'l', 'i'], ['e']),
+          (['o', 'u', 's', 'l', 'i'], ['o', 'u', 's']),),
+    'o': ((['i', 'z', 'a', 't', 'i', 'o', 'n'], ['i', 'z', 'e']),
+          (['a', 't', 'i', 'o', 'n'], ['a', 't', 'e']),
+          (['a', 't', 'o', 'r'], ['a', 't', 'e']),),
+    's': ((['a', 'l', 'i', 's', 'm'], ['a', 'l']),
+          (['i', 'v', 'e', 'n', 'e', 's', 's'], ['i', 'v', 'e']),
+          (['f', 'u', 'l', 'n', 'e', 's', 's'], ['f', 'u', 'l']),
+          (['o', 'u', 's', 'n', 'e', 's', 's'], ['o', 'u', 's']),),
+    't': ((['a', 'l', 'i', 't', 'i'], ['a', 'l']),
+          (['i', 'v', 'i', 't', 'i'], ['i', 'v', 'e']),
+          (['b', 'i', 'l', 'i', 't', 'i'], ['b', 'l', 'e']),),
+    'g': ((['l', 'o', 'g', 'i'], ['l', 'o', 'g']),),
+}
+
+
+_s3_options = {
+    'e': ((['i', 'c', 'a', 't', 'e'], ['i', 'c']),
+          (['a', 't', 'i', 'v', 'e'], []),
+          (['a', 'l', 'i', 'z', 'e'], ['a', 'l']),),
+    'i': ((['i', 'c', 'i', 't', 'i'], ['i', 'c']),),
+    'l': ((['i', 'c', 'a', 'l'], ['i', 'c']),
+          (['f', 'u', 'l'], []),),
+    's': ((['n', 'e', 's', 's'], []),),
+}
+
+_s4_endings = {
+    'a': (['a', 'l'],),
+    'c': (['a', 'n', 'c', 'e'], ['e', 'n', 'c', 'e']),
+    'e': (['e', 'r'],),
+    'i': (['i', 'c'],),
+    'l': (['a', 'b', 'l', 'e'], ['i', 'b', 'l', 'e']),
+    'n': (['a', 'n', 't'], ['e', 'm', 'e', 'n', 't'], ['m', 'e', 'n', 't'],
+          ['e', 'n', 't']),
+    # handle 'o' separately
+    's': (['i', 's', 'm'],),
+    't': (['a', 't', 'e'], ['i', 't', 'i']),
+    'u': (['o', 'u', 's'],),
+    'v': (['i', 'v', 'e'],),
+    'z': (['i', 'z', 'e'],),
+}
+
+
+class Stemmer(object):
+    def __init__(self, b):
+        self.b = list(b)
+        self.k = len(b)-1
+        self.j = 0
+
+    def cons(self, i):
+        """ True iff b[i] is a consonant """
+        if self.b[i] in 'aeiou':
+            return False
+        elif self.b[i] == 'y':
+            return True if i == 0 else not self.cons(i-1)
+        return True
+
+    def m(self):
+        n = i = 0
+        while True:
+            if i > self.j:
+                return n
+            if not self.cons(i):
+                break
+            i += 1
+        i += 1
+        while True:
+            while True:
+                if i > self.j:
+                    return n
+                if self.cons(i):
+                    break
+                i += 1
+
+            i += 1
+            n += 1
+
+            while True:
+                if i > self.j:
+                    return n
+                if not self.cons(i):
+                    break
+                i += 1
+            i += 1
+
+    def vowel_in_stem(self):
+        """ True iff 0...j contains vowel """
+        for i in _range(0, self.j+1):
+            if not self.cons(i):
+                return True
+        return False
+
+    def doublec(self, j):
+        """ True iff j, j-1 contains double consonant """
+        if j < 1 or self.b[j] != self.b[j-1]:
+            return False
+        return self.cons(j)
+
+    def cvc(self, i):
+        """ True iff i-2,i-1,i is consonent-vowel consonant
+        and if second c isn't w,x, or y.
+        used to restore e at end of short words like cave, love, hope, crime
+        """
+        if (i < 2 or not self.cons(i) or self.cons(i-1) or not self.cons(i-2) or
+                self.b[i] in 'wxy'):
+            return False
+        return True
+
+    def ends(self, s):
+        length = len(s)
+        """ True iff 0...k ends with string s """
+        res = (self.b[self.k-length+1:self.k+1] == s)
+        if res:
+            self.j = self.k - length
+        return res
+
+    def setto(self, s):
+        """ set j+1...k to string s, readjusting k """
+        length = len(s)
+        self.b[self.j+1:self.j+1+length] = s
+        self.k = self.j + length
+
+    def r(self, s):
+        if self.m() > 0:
+            self.setto(s)
+
+    def step1ab(self):
+        if self.b[self.k] == 's':
+            if self.ends(['s', 's', 'e', 's']):
+                self.k -= 2
+            elif self.ends(['i', 'e', 's']):
+                self.setto(['i'])
+            elif self.b[self.k-1] != 's':
+                self.k -= 1
+        if self.ends(['e', 'e', 'd']):
+            if self.m() > 0:
+                self.k -= 1
+        elif ((self.ends(['e', 'd']) or self.ends(['i', 'n', 'g'])) and
+              self.vowel_in_stem()):
+            self.k = self.j
+            if self.ends(['a', 't']):
+                self.setto(['a', 't', 'e'])
+            elif self.ends(['b', 'l']):
+                self.setto(['b', 'l', 'e'])
+            elif self.ends(['i', 'z']):
+                self.setto(['i', 'z', 'e'])
+            elif self.doublec(self.k):
+                self.k -= 1
+                if self.b[self.k] in 'lsz':
+                    self.k += 1
+            elif self.m() == 1 and self.cvc(self.k):
+                self.setto(['e'])
+
+    def step1c(self):
+        """ turn terminal y into i if there's a vowel in stem """
+        if self.ends(['y']) and self.vowel_in_stem():
+            self.b[self.k] = 'i'
+
+    def step2and3(self):
+        for end, repl in _s2_options.get(self.b[self.k-1], []):
+            if self.ends(end):
+                self.r(repl)
+                break
+
+        for end, repl in _s3_options.get(self.b[self.k], []):
+            if self.ends(end):
+                self.r(repl)
+                break
+
+    def step4(self):
+        ch = self.b[self.k-1]
+
+        if ch == 'o':
+            if not ((self.ends(['i', 'o', 'n']) and self.b[self.j] in 'st') or
+                    self.ends(['o', 'u'])):
+                return
+        else:
+            endings = _s4_endings.get(ch, [])
+            for end in endings:
+                if self.ends(end):
+                    break
+            else:
+                return
+
+        if self.m() > 1:
+            self.k = self.j
+
+    def step5(self):
+        self.j = self.k
+        if self.b[self.k] == 'e':
+            a = self.m()
+            if a > 1 or a == 1 and not self.cvc(self.k-1):
+                self.k -= 1
+        if self.b[self.k] == 'l' and self.doublec(self.k) and self.m() > 1:
+            self.k -= 1
+
+    def result(self):
+        return ''.join(self.b[:self.k+1])
+
+    def stem(self):
+        if self.k > 1:
+            self.step1ab()
+            self.step1c()
+            self.step2and3()
+            self.step4()
+            self.step5()
+        return self.result()
@@ -0,0 +1,213 @@
+# -*- coding: utf-8 -*-
+import sys
+if sys.version_info[0] < 3:
+    import unicodecsv as csv
+    open_kwargs = {}
+else:
+    import csv
+    open_kwargs = {'encoding': 'utf8'}
+import platform
+import pytest
+
+
+def assertAlmostEqual(a, b, places=3):
+    assert abs(a - b) < (0.1**places)
+
+
+if platform.python_implementation() == 'CPython':
+    implementations = ['python', 'c']
+else:
+    implementations = ['python']
+
+
+@pytest.fixture(params=implementations)
+def jf(request):
+    if request.param == 'python':
+        from jellyfish import _jellyfish as jf
+    else:
+        from jellyfish import cjellyfish as jf
+    return jf
+
+
+def _load_data(name):
+    with open('testdata/{}.csv'.format(name), **open_kwargs) as f:
+        for data in csv.reader(f):
+            yield data
+
+
+@pytest.mark.parametrize("s1,s2,value", _load_data('jaro_winkler'), ids=str)
+def test_jaro_winkler(jf, s1, s2, value):
+    value = float(value)
+    assertAlmostEqual(jf.jaro_winkler(s1, s2), value, places=3)
+
+
+@pytest.mark.parametrize("s1,s2,value", _load_data('jaro_distance'), ids=str)
+def test_jaro_distance(jf, s1, s2, value):
+    value = float(value)
+    assertAlmostEqual(jf.jaro_distance(s1, s2), value, places=3)
+
+
+@pytest.mark.parametrize("s1,s2,value", _load_data('hamming'), ids=str)
+def test_hamming_distance(jf, s1, s2, value):
+    value = int(value)
+    assert jf.hamming_distance(s1, s2) == value
+
+
+@pytest.mark.parametrize("s1,s2,value", _load_data('levenshtein'), ids=str)
+def test_levenshtein_distance(jf, s1, s2, value):
+    value = int(value)
+    assert jf.levenshtein_distance(s1, s2) == value
+
+
+@pytest.mark.parametrize("s1,s2,value", _load_data('damerau_levenshtein'), ids=str)
+def test_damerau_levenshtein_distance(jf, s1, s2, value):
+    value = int(value)
+    assert jf.damerau_levenshtein_distance(s1, s2) == value
+
+
+@pytest.mark.parametrize("s1,code", _load_data('soundex'), ids=str)
+def test_soundex(jf, s1, code):
+    assert jf.soundex(s1) == code
+
+
+@pytest.mark.parametrize("s1,code", _load_data('metaphone'), ids=str)
+def test_metaphone(jf, s1, code):
+    assert jf.metaphone(s1) == code
+
+
+@pytest.mark.parametrize("s1,s2", _load_data('nysiis'), ids=str)
+def test_nysiis(jf, s1, s2):
+    assert jf.nysiis(s1) == s2
+
+
+@pytest.mark.parametrize("s1,s2", _load_data('match_rating_codex'), ids=str)
+def test_match_rating_codex(jf, s1, s2):
+    assert jf.match_rating_codex(s1) == s2
+
+
+@pytest.mark.parametrize("s1,s2,value", _load_data('match_rating_comparison'), ids=str)
+def test_match_rating_comparison(jf, s1, s2, value):
+    value = {'True': True, 'False': False, 'None': None}[value]
+    assert jf.match_rating_comparison(s1, s2) is value
+
+
+# use non-parameterized version for speed
+# @pytest.mark.parametrize("a,b", _load_data('porter'), ids=str)
+# def test_porter_stem(jf, a, b):
+#     assert jf.porter_stem(a) == b
+
+def test_porter_stem(jf):
+    with open('testdata/porter.csv', **open_kwargs) as f:
+        reader = csv.reader(f)
+        for (a, b) in reader:
+            assert jf.porter_stem(a) == b
+
+
+if platform.python_implementation() == 'CPython':
+    def test_match_rating_comparison_segfault():
+        import hashlib
+        from jellyfish import cjellyfish as jf
+        sha1s = [u'{}'.format(hashlib.sha1(str(v).encode('ascii')).hexdigest())
+                 for v in range(100)]
+        # this segfaulted on 0.1.2
+        assert [[jf.match_rating_comparison(h1, h2) for h1 in sha1s] for h2 in sha1s]
+
+
+    def test_damerau_levenshtein_unicode_segfault():
+        # unfortunate difference in behavior between Py & C versions
+        from jellyfish.cjellyfish import damerau_levenshtein_distance as c_dl
+        from jellyfish._jellyfish import damerau_levenshtein_distance as py_dl
+        s1 = u'mylifeoutdoors'
+        s2 = u'нахлыст'
+        with pytest.raises(ValueError):
+            c_dl(s1, s2)
+        with pytest.raises(ValueError):
+            c_dl(s2, s1)
+
+        assert py_dl(s1, s2) == 14
+        assert py_dl(s2, s1) == 14
+
+
+def test_jaro_winkler_long_tolerance(jf):
+    no_lt = jf.jaro_winkler(u'two long strings', u'two long stringz', long_tolerance=False)
+    with_lt = jf.jaro_winkler(u'two long strings', u'two long stringz', long_tolerance=True)
+    # make sure long_tolerance does something
+    assertAlmostEqual(no_lt, 0.975)
+    assertAlmostEqual(with_lt, 0.984)
+
+
+def test_damerau_levenshtein_distance_type(jf):
+    jf.damerau_levenshtein_distance(u'abc', u'abc')
+    with pytest.raises(TypeError) as exc:
+        jf.damerau_levenshtein_distance(b'abc', b'abc')
+    assert 'expected' in str(exc.value)
+
+
+def test_levenshtein_distance_type(jf):
+    assert jf.levenshtein_distance(u'abc', u'abc') == 0
+    with pytest.raises(TypeError) as exc:
+        jf.levenshtein_distance(b'abc', b'abc')
+    assert 'expected' in str(exc.value)
+
+
+def test_jaro_distance_type(jf):
+    assert jf.jaro_distance(u'abc', u'abc') == 1
+    with pytest.raises(TypeError) as exc:
+        jf.jaro_distance(b'abc', b'abc')
+    assert 'expected' in str(exc.value)
+
+
+def test_jaro_winkler_type(jf):
+    assert jf.jaro_winkler(u'abc', u'abc') == 1
+    with pytest.raises(TypeError) as exc:
+        jf.jaro_winkler(b'abc', b'abc')
+    assert 'expected' in str(exc.value)
+
+
+def test_mra_comparison_type(jf):
+    assert jf.match_rating_comparison(u'abc', u'abc') is True
+    with pytest.raises(TypeError) as exc:
+        jf.match_rating_comparison(b'abc', b'abc')
+    assert 'expected' in str(exc.value)
+
+
+def test_hamming_type(jf):
+    assert jf.hamming_distance(u'abc', u'abc') == 0
+    with pytest.raises(TypeError) as exc:
+        jf.hamming_distance(b'abc', b'abc')
+    assert 'expected' in str(exc.value)
+
+
+def test_soundex_type(jf):
+    assert jf.soundex(u'ABC') == 'A120'
+    with pytest.raises(TypeError) as exc:
+        jf.soundex(b'ABC')
+    assert 'expected' in str(exc.value)
+
+
+def test_metaphone_type(jf):
+    assert jf.metaphone(u'abc') == 'ABK'
+    with pytest.raises(TypeError) as exc:
+        jf.metaphone(b'abc')
+    assert 'expected' in str(exc.value)
+
+
+def test_nysiis_type(jf):
+    assert jf.nysiis(u'abc') == 'ABC'
+    with pytest.raises(TypeError) as exc:
+        jf.nysiis(b'abc')
+    assert 'expected' in str(exc.value)
+
+
+def test_mr_codex_type(jf):
+    assert jf.match_rating_codex(u'abc') == 'ABC'
+    with pytest.raises(TypeError) as exc:
+        jf.match_rating_codex(b'abc')
+    assert 'expected' in str(exc.value)
+
+
+def test_porter_type(jf):
+    assert jf.porter_stem(u'abc') == 'abc'
+    with pytest.raises(TypeError) as exc:
+        jf.porter_stem(b'abc')
+    assert 'expected' in str(exc.value)
@@ -13,6 +13,7 @@ import json

 from musicbrainzngs import compat
 from musicbrainzngs import musicbrainz
+from musicbrainzngs.util import _unicode

 hostname = "coverartarchive.org"

@@ -78,7 +79,8 @@ def _caa_request(mbid, imageid=None, size=None, entitytype="release"):
        return resp
    else:
        # Otherwise it's json
-        return json.loads(resp)
+        data = _unicode(resp)
+        return json.loads(data)


 def get_image_list(releaseid):
@@ -88,7 +90,7 @@ def get_image_list(releaseid):
    <http://musicbrainz.org/doc/Cover_Art_Archive/API#.2Frelease.2F.7Bmbid.7D.2F>`_
    returned by the Cover Art Archive API.

-    If an error occurs then a musicbrainz.ResponseError will
+    If an error occurs then a :class:`~musicbrainzngs.ResponseError` will
    be raised with one of the following HTTP codes:

    * 400: `Releaseid` is not a valid UUID
@@ -105,7 +107,7 @@ def get_release_group_image_list(releasegroupid):
    <http://musicbrainz.org/doc/Cover_Art_Archive/API#.2Frelease-group.2F.7Bmbid.7D.2F>`_
    returned by the Cover Art Archive API.

-    If an error occurs then a musicbrainz.ResponseError will
+    If an error occurs then a :class:`~musicbrainzngs.ResponseError` will
    be raised with one of the following HTTP codes:

    * 400: `Releaseid` is not a valid UUID
@@ -147,8 +149,8 @@ def get_image(mbid, coverid, size=None, entitytype="release"):
    If `size` is not specified, download the largest copy present, which can be
    very large.

-    If an error occurs then a musicbrainz.ResponseError will be raised with one
-    of the following HTTP codes:
+    If an error occurs then a :class:`~musicbrainzngs.ResponseError`
+    will be raised with one of the following HTTP codes:

    * 400: `Releaseid` is not a valid UUID or `coverid` is invalid
    * 404: No release exists with an MBID of `releaseid`
@@ -40,8 +40,7 @@ is_py3 = (_ver[0] == 3)
 if is_py2:
 	from StringIO import StringIO
 	from urllib2 import HTTPPasswordMgr, HTTPDigestAuthHandler, Request,\
-						HTTPHandler, build_opener, HTTPError, URLError,\
-						build_opener
+						HTTPHandler, build_opener, HTTPError, URLError
 	from httplib import BadStatusLine, HTTPException
 	from urlparse import urlunparse
 	from urllib import urlencode
@@ -84,8 +84,10 @@ def parse_elements(valid_els, inner_els, element):
        call parse_subelement(<subelement>) and
        return a dict {'subelement': <result>}
        if parse_subelement returns a tuple of the form
-        ('subelement-key', <result>) then return a dict
-        {'subelement-key': <result>} instead
+        (True, {'subelement-key': <result>})
+        then merge the second element of the tuple into the
+        result (which may have a key other than 'subelement' or
+        more than 1 key)
    """
    result = {}
    for sub in element:
@@ -96,8 +98,8 @@ def parse_elements(valid_els, inner_els, element):
            result[t] = sub.text or ""
        elif t in inner_els.keys():
            inner_result = inner_els[t](sub)
-            if isinstance(inner_result, tuple):
-                result[inner_result[0]] = inner_result[1]
+            if isinstance(inner_result, tuple) and inner_result[0]:
+                result.update(inner_result[1])
            else:
                result[t] = inner_result
            # add counts for lists when available
@@ -135,8 +137,10 @@ def parse_message(message):
    result = {}
    valid_elements = {"area": parse_area,
                      "artist": parse_artist,
+                      "instrument": parse_instrument,
                      "label": parse_label,
                      "place": parse_place,
+                      "event": parse_event,
                      "release": parse_release,
                      "release-group": parse_release_group,
                      "series": parse_series,
@@ -153,6 +157,8 @@ def parse_message(message):
                      "artist-list": parse_artist_list,
                      "label-list": parse_label_list,
                      "place-list": parse_place_list,
+                      "event-list": parse_event_list,
+                      "instrument-list": parse_instrument_list,
                      "release-list": parse_release_list,
                      "release-group-list": parse_release_group_list,
                      "series-list": parse_series_list,
@@ -176,9 +182,14 @@ def parse_collection_list(cl):

 def parse_collection(collection):
    result = {}
-    attribs = ["id"]
+    attribs = ["id", "type", "entity-type"]
    elements = ["name", "editor"]
-    inner_els = {"release-list": parse_release_list}
+    inner_els = {"release-list": parse_release_list,
+                 "artist-list": parse_artist_list,
+                 "event-list": parse_event_list,
+                 "place-list": parse_place_list,
+                 "recording-list": parse_recording_list,
+                 "work-list": parse_work_list}
    result.update(parse_attributes(attribs, collection))
    result.update(parse_elements(elements, inner_els, collection))

@@ -275,6 +286,38 @@ def parse_place(place):

    return result

+def parse_event_list(el):
+    return [parse_event(e) for e in el]
+
+def parse_event(event):
+    result = {}
+    attribs = ["id", "type", "ext:score"]
+    elements = ["name", "time", "setlist", "cancelled", "disambiguation", "user-rating"]
+    inner_els = {"life-span": parse_lifespan,
+                 "relation-list": parse_relation_list,
+                 "alias-list": parse_alias_list,
+                 "tag-list": parse_tag_list,
+                 "user-tag-list": parse_tag_list,
+                 "rating": parse_rating}
+
+    result.update(parse_attributes(attribs, event))
+    result.update(parse_elements(elements, inner_els, event))
+
+    return result
+
+def parse_instrument(instrument):
+    result = {}
+    attribs = ["id", "type", "ext:score"]
+    elements = ["name", "description", "disambiguation"]
+    inner_els = {"relation-list": parse_relation_list,
+                 "tag-list": parse_tag_list,
+                 "alias-list": parse_alias_list,
+                 "annotation": parse_annotation}
+    result.update(parse_attributes(attribs, instrument))
+    result.update(parse_elements(elements, inner_els, instrument))
+
+    return result
+
 def parse_label_list(ll):
    return [parse_label(l) for l in ll]

@@ -302,15 +345,15 @@ def parse_label(label):
 def parse_relation_target(tgt):
    attributes = parse_attributes(['id'], tgt)
    if 'id' in attributes:
-        return ('target-id', attributes['id'])
+        return (True, {'target-id': attributes['id']})
    else:
-        return ('target-id', tgt.text)
+        return (True, {'target-id': tgt.text})

 def parse_relation_list(rl):
    attribs = ["target-type"]
    ttype = parse_attributes(attribs, rl)
    key = "%s-relation-list" % ttype["target-type"]
-    return (key, [parse_relation(r) for r in rl])
+    return (True, {key: [parse_relation(r) for r in rl]})

 def parse_relation(relation):
    result = {}
@@ -318,8 +361,10 @@ def parse_relation(relation):
    elements = ["target", "direction", "begin", "end", "ended", "ordering-key"]
    inner_els = {"area": parse_area,
                 "artist": parse_artist,
+                 "instrument": parse_instrument,
                 "label": parse_label,
                 "place": parse_place,
+                 "event": parse_event,
                 "recording": parse_recording,
                 "release": parse_release,
                 "release-group": parse_release_group,
@@ -330,9 +375,34 @@ def parse_relation(relation):
                }
    result.update(parse_attributes(attribs, relation))
    result.update(parse_elements(elements, inner_els, relation))
+    # We parse attribute-list again to get attributes that have both
+    # text and attribute values
+    result.update(parse_elements([], {"attribute-list": parse_relation_attribute_list}, relation))

    return result

+def parse_relation_attribute_list(attributelist):
+    ret = []
+    for attribute in attributelist:
+        ret.append(parse_relation_attribute_element(attribute))
+    return (True, {"attributes": ret})
+
+def parse_relation_attribute_element(element):
+    # Parses an attribute into a dictionary containing an element
+    # {"attribute": <text value>} and also an additional element
+    # containing any xml attributes.
+    # e.g <attribute value="BuxWV 1">number</attribute>
+    # -> {"attribute": "number", "value": "BuxWV 1"}
+    result = {}
+    for attr in element.attrib:
+        if "{" in attr:
+            a = fixtag(attr, NS_MAP)[0]
+        else:
+            a = attr
+        result[a] = element.attrib[attr]
+    result["attribute"] = element.text
+    return result
+
 def parse_release(release):
    result = {}
    attribs = ["id", "ext:score"]
@@ -359,7 +429,22 @@ def parse_release(release):
    return result

 def parse_medium_list(ml):
-    return [parse_medium(m) for m in ml]
+    """medium-list results from search have an additional
+    <track-count> element containing the number of tracks
+    over all mediums. Optionally add this"""
+    medium_list = []
+    track_count = None
+    for m in ml:
+        tag = fixtag(m.tag, NS_MAP)[0]
+        if tag == "ws2:medium":
+            medium_list.append(parse_medium(m))
+        elif tag == "ws2:track-count":
+            track_count = int(m.text)
+    ret = {"medium-list": medium_list}
+    if track_count is not None:
+        ret["medium-track-count"] = track_count
+
+    return (True, ret)

 def parse_release_event_list(rel):
    return [parse_release_event(re) for re in rel]
@@ -376,7 +461,9 @@ def parse_medium(medium):
    result = {}
    elements = ["position", "format", "title"]
    inner_els = {"disc-list": parse_disc_list,
-                 "track-list": parse_track_list}
+                 "pregap": parse_track,
+                 "track-list": parse_track_list,
+                 "data-track-list": parse_track_list}

    result.update(parse_elements(elements, inner_els, medium))
    return result
@@ -477,11 +564,12 @@ def parse_work_attribute_list(wal):
    return [parse_work_attribute(wa) for wa in wal]

 def parse_work_attribute(wa):
-    result = {}
    attribs = ["type"]
-
-    result.update(parse_attributes(attribs, wa))
-    result["attribute"] = wa.text
+    typeinfo = parse_attributes(attribs, wa)
+    result = {}
+    if typeinfo:
+        result = {"attribute": typeinfo["type"],
+                  "value": wa.text}

    return result

@@ -504,7 +592,9 @@ def parse_disc(disc):
    result = {}
    attribs = ["id"]
    elements = ["sectors"]
-    inner_els = {"release-list": parse_release_list}
+    inner_els = {"release-list": parse_release_list,
+                 "offset-list": parse_offset_list
+    }

    result.update(parse_attributes(attribs, disc))
    result.update(parse_elements(elements, inner_els, disc))
@@ -522,6 +612,15 @@ def parse_cdstub(cdstub):

    return result

+def parse_offset_list(ol):
+    return [int(o.text) for o in ol]
+
+def parse_instrument_list(rl):
+    result = []
+    for r in rl:
+        result.append(parse_instrument(r))
+    return result
+
 def parse_release_list(rl):
    result = []
    for r in rl:
@@ -20,16 +20,17 @@ from musicbrainzngs import mbxml
 from musicbrainzngs import util
 from musicbrainzngs import compat

+# headphones
 import base64

-_version = "0.6devMODIFIED"
+_version = "0.7devheadphones"
 _log = logging.getLogger("musicbrainzngs")

 LUCENE_SPECIAL = r'([+\-&|!(){}\[\]\^"~*?:\\\/])'

 # Constants for validation.

-RELATABLE_TYPES = ['area', 'artist', 'label', 'place', 'recording', 'release', 'release-group', 'series', 'url', 'work']
+RELATABLE_TYPES = ['area', 'artist', 'label', 'place', 'event', 'recording', 'release', 'release-group', 'series', 'url', 'work', 'instrument']
 RELATION_INCLUDES = [entity + '-rels' for entity in RELATABLE_TYPES]
 TAG_INCLUDES = ["tags", "user-tags"]
 RATING_INCLUDES = ["ratings", "user-ratings"]
@@ -44,19 +45,19 @@ VALID_INCLUDES = {
    'annotation': [

    ],
-    'instrument': [
-
-    ],
+    'instrument': ["aliases", "annotation"
+    ] + RELATION_INCLUDES + TAG_INCLUDES,
    'label': [
        "releases", # Subqueries
        "discids", "media",
        "aliases", "annotation"
    ] + RELATION_INCLUDES + TAG_INCLUDES + RATING_INCLUDES,
    'place' : ["aliases", "annotation"] + RELATION_INCLUDES + TAG_INCLUDES,
+    'event' : ["aliases"] + RELATION_INCLUDES + TAG_INCLUDES + RATING_INCLUDES,
    'recording': [
        "artists", "releases", # Subqueries
        "discids", "media", "artist-credits", "isrcs",
-        "annotation", "aliases"
+        "work-level-rels", "annotation", "aliases"
    ] + TAG_INCLUDES + RATING_INCLUDES + RELATION_INCLUDES,
    'release': [
        "artists", "labels", "recordings", "release-groups", "media",
@@ -85,13 +86,16 @@ VALID_INCLUDES = {
    'collection': ['releases'],
 }
 VALID_BROWSE_INCLUDES = {
-    'releases': ["artist-credits", "labels", "recordings", "isrcs",
+    'artist': ["aliases"] + TAG_INCLUDES + RATING_INCLUDES + RELATION_INCLUDES,
+    'event': ["aliases"] + TAG_INCLUDES + RATING_INCLUDES + RELATION_INCLUDES,
+    'label': ["aliases"] + TAG_INCLUDES + RATING_INCLUDES + RELATION_INCLUDES,
+    'recording': ["artist-credits", "isrcs"] + TAG_INCLUDES + RATING_INCLUDES + RELATION_INCLUDES,
+    'release': ["artist-credits", "labels", "recordings", "isrcs",
                "release-groups", "media", "discids"] + RELATION_INCLUDES,
-    'recordings': ["artist-credits", "isrcs"] + TAG_INCLUDES + RATING_INCLUDES + RELATION_INCLUDES,
-    'labels': ["aliases"] + TAG_INCLUDES + RATING_INCLUDES + RELATION_INCLUDES,
-    'artists': ["aliases"] + TAG_INCLUDES + RATING_INCLUDES + RELATION_INCLUDES,
-    'urls': RELATION_INCLUDES,
-    'release-groups': ["artist-credits"] + TAG_INCLUDES + RATING_INCLUDES + RELATION_INCLUDES
+    'place': ["aliases"] + TAG_INCLUDES + RELATION_INCLUDES,
+    'release-group': ["artist-credits"] + TAG_INCLUDES + RATING_INCLUDES + RELATION_INCLUDES,
+    'url': RELATION_INCLUDES,
+    'work': ["aliases", "annotation"] + TAG_INCLUDES + RATING_INCLUDES + RELATION_INCLUDES,
 }

 #: These can be used to filter whenever releases are includes or browsed
@@ -264,21 +268,26 @@ def _check_filter_and_make_params(entity, includes, release_status=[], release_t
        params["type"] = "|".join(release_type)
    return params

-def _docstring(entity, browse=False):
+def _docstring_get(entity):
+    includes = list(VALID_INCLUDES.get(entity, []))
+    return _docstring_impl("includes", includes)
+
+def _docstring_browse(entity):
+    includes = list(VALID_BROWSE_INCLUDES.get(entity, []))
+    return _docstring_impl("includes", includes)
+
+def _docstring_search(entity):
+    search_fields = list(VALID_SEARCH_FIELDS.get(entity, []))
+    return _docstring_impl("fields", search_fields)
+
+def _docstring_impl(name, values):
    def _decorator(func):
-        if browse:
-            includes = list(VALID_BROWSE_INCLUDES.get(entity, []))
-        else:
-            includes = list(VALID_INCLUDES.get(entity, []))
        # puids are allowed so nothing breaks, but not documented
-        if "puids" in includes: includes.remove("puids")
-        includes = ", ".join(includes)
+        if "puids" in values: values.remove("puids")
+        vstr = ", ".join(values)
+        args = {name: vstr}
        if func.__doc__:
-            search_fields = list(VALID_SEARCH_FIELDS.get(entity, []))
-            # puid is allowed so nothing breaks, but not documented
-            if "puid" in search_fields: search_fields.remove("puid")
-            func.__doc__ = func.__doc__.format(includes=includes,
-                    fields=", ".join(search_fields))
+            func.__doc__ = func.__doc__.format(**args)
        return func

    return _decorator
@@ -299,7 +308,8 @@ def auth(u, p):
 	global user, password
 	user = u
 	password = p
-	
+
+# headphones
 def hpauth(u, p):
    """Set the username and password to be used in subsequent queries to
    the MusicBrainz XML API that require authentication.
@@ -329,8 +339,9 @@ def set_useragent(app, version, contact=None):
    _log.debug("set user-agent to %s" % _useragent)

 def set_hostname(new_hostname):
-    """Set the base hostname for MusicBrainz webservice requests.
-    Defaults to 'musicbrainz.org'."""
+    """Set the hostname for MusicBrainz webservice requests.
+    Defaults to 'musicbrainz.org'.
+    You can also include a port: 'localhost:8000'."""
    global hostname
    hostname = new_hostname

@@ -471,7 +482,7 @@ class _MusicbrainzHttpRequest(compat.Request):

 # Core (internal) functions for calling the MB API.

-def _safe_read(opener, req, body=None, max_retries=3, retry_delay_delta=2.0):
+def _safe_read(opener, req, body=None, max_retries=8, retry_delay_delta=2.0):
 	"""Open an HTTP request with a given URL opener and (optionally) a
 	request body. Transient errors lead to retries.  Permanent errors
 	and repeated errors are translated into a small set of handleable
@@ -673,7 +684,6 @@ def _mb_request(path, method='GET', auth_required=AUTH_NO,
    # Make request.
    req = _MusicbrainzHttpRequest(method, url, data)
    req.add_header('User-Agent', _useragent)
-    

    # Add headphones credentials
    if mb_auth:
@@ -806,7 +816,7 @@ def _do_mb_post(path, body):

 # Single entity by ID

-@_docstring('area')
+@_docstring_get("area")
 def get_area_by_id(id, includes=[], release_status=[], release_type=[]):
    """Get the area with the MusicBrainz `id` as a dict with an 'area' key.

@@ -815,7 +825,7 @@ def get_area_by_id(id, includes=[], release_status=[], release_type=[]):
                                           release_status, release_type)
    return _do_mb_query("area", id, includes, params)

-@_docstring('artist')
+@_docstring_get("artist")
 def get_artist_by_id(id, includes=[], release_status=[], release_type=[]):
    """Get the artist with the MusicBrainz `id` as a dict with an 'artist' key.

@@ -824,7 +834,7 @@ def get_artist_by_id(id, includes=[], release_status=[], release_type=[]):
                                           release_status, release_type)
    return _do_mb_query("artist", id, includes, params)

-@_docstring('instrument')
+@_docstring_get("instrument")
 def get_instrument_by_id(id, includes=[], release_status=[], release_type=[]):
    """Get the instrument with the MusicBrainz `id` as a dict with an 'artist' key.

@@ -833,7 +843,7 @@ def get_instrument_by_id(id, includes=[], release_status=[], release_type=[]):
                                           release_status, release_type)
    return _do_mb_query("instrument", id, includes, params)

-@_docstring('label')
+@_docstring_get("label")
 def get_label_by_id(id, includes=[], release_status=[], release_type=[]):
    """Get the label with the MusicBrainz `id` as a dict with a 'label' key.

@@ -842,7 +852,7 @@ def get_label_by_id(id, includes=[], release_status=[], release_type=[]):
                                           release_status, release_type)
    return _do_mb_query("label", id, includes, params)

-@_docstring('place')
+@_docstring_get("place")
 def get_place_by_id(id, includes=[], release_status=[], release_type=[]):
    """Get the place with the MusicBrainz `id` as a dict with an 'place' key.

@@ -851,7 +861,19 @@ def get_place_by_id(id, includes=[], release_status=[], release_type=[]):
                                           release_status, release_type)
    return _do_mb_query("place", id, includes, params)

-@_docstring('recording')
+@_docstring_get("event")
+def get_event_by_id(id, includes=[], release_status=[], release_type=[]):
+    """Get the event with the MusicBrainz `id` as a dict with an 'event' key.
+
+    The event dict has the following keys:
+    `id`, `type`, `name`, `time`, `disambiguation` and `life-span`.
+
+    *Available includes*: {includes}"""
+    params = _check_filter_and_make_params("event", includes,
+                                           release_status, release_type)
+    return _do_mb_query("event", id, includes, params)
+
+@_docstring_get("recording")
 def get_recording_by_id(id, includes=[], release_status=[], release_type=[]):
    """Get the recording with the MusicBrainz `id` as a dict
    with a 'recording' key.
@@ -861,7 +883,7 @@ def get_recording_by_id(id, includes=[], release_status=[], release_type=[]):
                                           release_status, release_type)
    return _do_mb_query("recording", id, includes, params)

-@_docstring('release')
+@_docstring_get("release")
 def get_release_by_id(id, includes=[], release_status=[], release_type=[]):
    """Get the release with the MusicBrainz `id` as a dict with a 'release' key.

@@ -870,7 +892,7 @@ def get_release_by_id(id, includes=[], release_status=[], release_type=[]):
                                           release_status, release_type)
    return _do_mb_query("release", id, includes, params)

-@_docstring('release-group')
+@_docstring_get("release-group")
 def get_release_group_by_id(id, includes=[],
                            release_status=[], release_type=[]):
    """Get the release group with the MusicBrainz `id` as a dict
@@ -881,21 +903,21 @@ def get_release_group_by_id(id, includes=[],
                                           release_status, release_type)
    return _do_mb_query("release-group", id, includes, params)

-@_docstring('series')
+@_docstring_get("series")
 def get_series_by_id(id, includes=[]):
    """Get the series with the MusicBrainz `id` as a dict with a 'series' key.

    *Available includes*: {includes}"""
    return _do_mb_query("series", id, includes)

-@_docstring('work')
+@_docstring_get("work")
 def get_work_by_id(id, includes=[]):
    """Get the work with the MusicBrainz `id` as a dict with a 'work' key.

    *Available includes*: {includes}"""
    return _do_mb_query("work", id, includes)

-@_docstring('url')
+@_docstring_get("url")
 def get_url_by_id(id, includes=[]):
    """Get the url with the MusicBrainz `id` as a dict with a 'url' key.

@@ -905,35 +927,56 @@ def get_url_by_id(id, includes=[]):

 # Searching

-@_docstring('annotation')
+@_docstring_search("annotation")
 def search_annotations(query='', limit=None, offset=None, strict=False, **fields):
    """Search for annotations and return a dict with an 'annotation-list' key.

    *Available search fields*: {fields}"""
    return _do_mb_search('annotation', query, fields, limit, offset, strict)

-@_docstring('area')
+@_docstring_search("area")
 def search_areas(query='', limit=None, offset=None, strict=False, **fields):
    """Search for areas and return a dict with an 'area-list' key.

    *Available search fields*: {fields}"""
    return _do_mb_search('area', query, fields, limit, offset, strict)

-@_docstring('artist')
+@_docstring_search("artist")
 def search_artists(query='', limit=None, offset=None, strict=False, **fields):
    """Search for artists and return a dict with an 'artist-list' key.

    *Available search fields*: {fields}"""
    return _do_mb_search('artist', query, fields, limit, offset, strict)

-@_docstring('label')
+@_docstring_search("event")
+def search_events(query='', limit=None, offset=None, strict=False, **fields):
+    """Search for events and return a dict with an 'event-list' key.
+
+    *Available search fields*: {fields}"""
+    return _do_mb_search('event', query, fields, limit, offset, strict)
+
+@_docstring_search("instrument")
+def search_instruments(query='', limit=None, offset=None, strict=False, **fields):
+    """Search for instruments and return a dict with a 'instrument-list' key.
+
+    *Available search fields*: {fields}"""
+    return _do_mb_search('instrument', query, fields, limit, offset, strict)
+
+@_docstring_search("label")
 def search_labels(query='', limit=None, offset=None, strict=False, **fields):
    """Search for labels and return a dict with a 'label-list' key.

    *Available search fields*: {fields}"""
    return _do_mb_search('label', query, fields, limit, offset, strict)

-@_docstring('recording')
+@_docstring_search("place")
+def search_places(query='', limit=None, offset=None, strict=False, **fields):
+    """Search for places and return a dict with a 'place-list' key.
+
+    *Available search fields*: {fields}"""
+    return _do_mb_search('place', query, fields, limit, offset, strict)
+
+@_docstring_search("recording")
 def search_recordings(query='', limit=None, offset=None,
                      strict=False, **fields):
    """Search for recordings and return a dict with a 'recording-list' key.
@@ -941,14 +984,14 @@ def search_recordings(query='', limit=None, offset=None,
    *Available search fields*: {fields}"""
    return _do_mb_search('recording', query, fields, limit, offset, strict)

-@_docstring('release')
+@_docstring_search("release")
 def search_releases(query='', limit=None, offset=None, strict=False, **fields):
    """Search for recordings and return a dict with a 'recording-list' key.

    *Available search fields*: {fields}"""
    return _do_mb_search('release', query, fields, limit, offset, strict)

-@_docstring('release-group')
+@_docstring_search("release-group")
 def search_release_groups(query='', limit=None, offset=None,
 			  strict=False, **fields):
    """Search for release groups and return a dict
@@ -957,14 +1000,14 @@ def search_release_groups(query='', limit=None, offset=None,
    *Available search fields*: {fields}"""
    return _do_mb_search('release-group', query, fields, limit, offset, strict)

-@_docstring('series')
+@_docstring_search("series")
 def search_series(query='', limit=None, offset=None, strict=False, **fields):
    """Search for series and return a dict with a 'series-list' key.

    *Available search fields*: {fields}"""
    return _do_mb_search('series', query, fields, limit, offset, strict)

-@_docstring('work')
+@_docstring_search("work")
 def search_works(query='', limit=None, offset=None, strict=False, **fields):
    """Search for works and return a dict with a 'work-list' key.

@@ -973,7 +1016,7 @@ def search_works(query='', limit=None, offset=None, strict=False, **fields):


 # Lists of entities
-@_docstring('discid')
+@_docstring_get("discid")
 def get_releases_by_discid(id, includes=[], toc=None, cdstubs=True, media_format=None):
    """Search for releases with a :musicbrainz:`Disc ID` or table of contents.

@@ -994,8 +1037,8 @@ def get_releases_by_discid(id, includes=[], toc=None, cdstubs=True, media_format

    The result is a dict with either a 'disc' , a 'cdstub' key
    or a 'release-list' (fuzzy match with TOC).
-    A 'disc' has a 'release-list' and a 'cdstub' key has direct 'artist'
-    and 'title' keys.
+    A 'disc' has an 'offset-count', an 'offset-list' and a 'release-list'.
+    A 'cdstub' key has direct 'artist' and 'title' keys.

    *Available includes*: {includes}"""
    params = _check_filter_and_make_params("discid", includes, release_status=[],
@@ -1008,7 +1051,7 @@ def get_releases_by_discid(id, includes=[], toc=None, cdstubs=True, media_format
        params["media-format"] = media_format
    return _do_mb_query("discid", id, includes, params)

-@_docstring('recording')
+@_docstring_get("recording")
 def get_recordings_by_echoprint(echoprint, includes=[], release_status=[],
                                release_type=[]):
    """Search for recordings with an `echoprint <http://echoprint.me>`_.
@@ -1019,7 +1062,7 @@ def get_recordings_by_echoprint(echoprint, includes=[], release_status=[],
    raise ResponseError(cause=compat.HTTPError(
                                            None, 404, "Not Found", None, None))

-@_docstring('recording')
+@_docstring_get("recording")
 def get_recordings_by_puid(puid, includes=[], release_status=[],
                           release_type=[]):
    """Search for recordings with a :musicbrainz:`PUID`.
@@ -1030,7 +1073,7 @@ def get_recordings_by_puid(puid, includes=[], release_status=[],
    raise ResponseError(cause=compat.HTTPError(
                                            None, 404, "Not Found", None, None))

-@_docstring('recording')
+@_docstring_get("recording")
 def get_recordings_by_isrc(isrc, includes=[], release_status=[],
                           release_type=[]):
    """Search for recordings with an :musicbrainz:`ISRC`.
@@ -1042,7 +1085,7 @@ def get_recordings_by_isrc(isrc, includes=[], release_status=[],
                                           release_status, release_type)
    return _do_mb_query("isrc", isrc, includes, params)

-@_docstring('work')
+@_docstring_get("work")
 def get_works_by_iswc(iswc, includes=[]):
    """Search for works with an :musicbrainz:`ISWC`.
    The result is a dict with a`work-list`.
@@ -1051,7 +1094,9 @@ def get_works_by_iswc(iswc, includes=[]):
    return _do_mb_query("iswc", iswc, includes)


-def _browse_impl(entity, includes, valid_includes, limit, offset, params, release_status=[], release_type=[]):
+def _browse_impl(entity, includes, limit, offset, params, release_status=[], release_type=[]):
+    includes = includes if isinstance(includes, list) else [includes]
+    valid_includes = VALID_BROWSE_INCLUDES[entity]
    _check_includes_impl(includes, valid_includes)
    p = {}
    for k,v in params.items():
@@ -1068,45 +1113,59 @@ def _browse_impl(entity, includes, valid_includes, limit, offset, params, releas
 # Browse methods
 # Browse include are a subset of regular get includes, so we check them here
 # and the test in _do_mb_query will pass anyway.
-@_docstring('artists', browse=True)
+@_docstring_browse("artist")
 def browse_artists(recording=None, release=None, release_group=None,
-                   includes=[], limit=None, offset=None):
+                   work=None, includes=[], limit=None, offset=None):
    """Get all artists linked to a recording, a release or a release group.
    You need to give one MusicBrainz ID.

    *Available includes*: {includes}"""
-    # optional parameter work?
-    valid_includes = VALID_BROWSE_INCLUDES['artists']
    params = {"recording": recording,
              "release": release,
-              "release-group": release_group}
-    return _browse_impl("artist", includes, valid_includes,
-                        limit, offset, params)
+              "release-group": release_group,
+              "work": work}
+    return _browse_impl("artist", includes, limit, offset, params)

-@_docstring('labels', browse=True)
+@_docstring_browse("event")
+def browse_events(area=None, artist=None, place=None,
+                   includes=[], limit=None, offset=None):
+    """Get all events linked to a area, a artist or a place.
+    You need to give one MusicBrainz ID.
+
+    *Available includes*: {includes}"""
+    params = {"area": area,
+              "artist": artist,
+              "place": place}
+    return _browse_impl("event", includes, limit, offset, params)
+
+@_docstring_browse("label")
 def browse_labels(release=None, includes=[], limit=None, offset=None):
    """Get all labels linked to a relase. You need to give a MusicBrainz ID.

    *Available includes*: {includes}"""
-    valid_includes = VALID_BROWSE_INCLUDES['labels']
    params = {"release": release}
-    return _browse_impl("label", includes, valid_includes,
-                        limit, offset, params)
+    return _browse_impl("label", includes, limit, offset, params)

-@_docstring('recordings', browse=True)
+@_docstring_browse("place")
+def browse_places(area=None, includes=[], limit=None, offset=None):
+    """Get all places linked to an area. You need to give a MusicBrainz ID.
+
+    *Available includes*: {includes}"""
+    params = {"area": area}
+    return _browse_impl("place", includes, limit, offset, params)
+
+@_docstring_browse("recording")
 def browse_recordings(artist=None, release=None, includes=[],
                      limit=None, offset=None):
    """Get all recordings linked to an artist or a release.
    You need to give one MusicBrainz ID.

    *Available includes*: {includes}"""
-    valid_includes = VALID_BROWSE_INCLUDES['recordings']
    params = {"artist": artist,
              "release": release}
-    return _browse_impl("recording", includes, valid_includes,
-                        limit, offset, params)
+    return _browse_impl("recording", includes, limit, offset, params)

-@_docstring('releases', browse=True)
+@_docstring_browse("release")
 def browse_releases(artist=None, track_artist=None, label=None, recording=None,
                    release_group=None, release_status=[], release_type=[],
                    includes=[], limit=None, offset=None):
@@ -1121,16 +1180,15 @@ def browse_releases(artist=None, track_artist=None, label=None, recording=None,

    *Available includes*: {includes}"""
    # track_artist param doesn't work yet
-    valid_includes = VALID_BROWSE_INCLUDES['releases']
    params = {"artist": artist,
              "track_artist": track_artist,
              "label": label,
              "recording": recording,
              "release-group": release_group}
-    return _browse_impl("release", includes, valid_includes, limit, offset,
+    return _browse_impl("release", includes, limit, offset,
                        params, release_status, release_type)

-@_docstring('release-groups', browse=True)
+@_docstring_browse("release-group")
 def browse_release_groups(artist=None, release=None, release_type=[],
                          includes=[], limit=None, offset=None):
    """Get all release groups linked to an artist or a release.
@@ -1139,25 +1197,27 @@ def browse_release_groups(artist=None, release=None, release_type=[],
    You can filter by :data:`musicbrainz.VALID_RELEASE_TYPES`.

    *Available includes*: {includes}"""
-    valid_includes = VALID_BROWSE_INCLUDES['release-groups']
    params = {"artist": artist,
              "release": release}
-    return _browse_impl("release-group", includes, valid_includes,
-                        limit, offset, params, [], release_type)
+    return _browse_impl("release-group", includes, limit,
+                        offset, params, [], release_type)

-@_docstring('urls', browse=True)
+@_docstring_browse("url")
 def browse_urls(resource=None, includes=[], limit=None, offset=None):
    """Get urls by actual URL string.
    You need to give a URL string as 'resource'

    *Available includes*: {includes}"""
-    # optional parameter work?
-    valid_includes = VALID_BROWSE_INCLUDES['urls']
    params = {"resource": resource}
-    return _browse_impl("url", includes, valid_includes,
-                        limit, offset, params)
+    return _browse_impl("url", includes, limit, offset, params)

-# browse_work is defined in the docs but has no browse criteria
+@_docstring_browse("work")
+def browse_works(artist=None, includes=[], limit=None, offset=None):
+    """Get all works linked to an artist
+
+    *Available includes*: {includes}"""
+    params = {"artist": artist}
+    return _browse_impl("work", includes, limit, offset, params)

 # Collections
 def get_collections():
@@ -1166,16 +1226,59 @@ def get_collections():
    # Missing <release-list count="n"> the count in the reply
    return _do_mb_query("collection", '')

+def _do_collection_query(collection, collection_type, limit, offset):
+    params = {}
+    if limit: params["limit"] = limit
+    if offset: params["offset"] = offset
+    return _do_mb_query("collection", "%s/%s" % (collection, collection_type), [], params)
+
+def get_artists_in_collection(collection, limit=None, offset=None):
+    """List the artists in a collection.
+    Returns a dict with a 'collection' key, which again has a 'artist-list'.
+
+    See `Browsing`_ for how to use `limit` and `offset`.
+    """
+    return _do_collection_query(collection, "artists", limit, offset)
+
 def get_releases_in_collection(collection, limit=None, offset=None):
    """List the releases in a collection.
    Returns a dict with a 'collection' key, which again has a 'release-list'.

    See `Browsing`_ for how to use `limit` and `offset`.
    """
-    params = {}
-    if limit: params["limit"] = limit
-    if offset: params["offset"] = offset
-    return _do_mb_query("collection", "%s/releases" % collection, [], params)
+    return _do_collection_query(collection, "releases", limit, offset)
+
+def get_events_in_collection(collection, limit=None, offset=None):
+    """List the events in a collection.
+    Returns a dict with a 'collection' key, which again has a 'event-list'.
+
+    See `Browsing`_ for how to use `limit` and `offset`.
+    """
+    return _do_collection_query(collection, "events", limit, offset)
+
+def get_places_in_collection(collection, limit=None, offset=None):
+    """List the places in a collection.
+    Returns a dict with a 'collection' key, which again has a 'place-list'.
+
+    See `Browsing`_ for how to use `limit` and `offset`.
+    """
+    return _do_collection_query(collection, "places", limit, offset)
+
+def get_recordings_in_collection(collection, limit=None, offset=None):
+    """List the recordings in a collection.
+    Returns a dict with a 'collection' key, which again has a 'recording-list'.
+
+    See `Browsing`_ for how to use `limit` and `offset`.
+    """
+    return _do_collection_query(collection, "recordings", limit, offset)
+
+def get_works_in_collection(collection, limit=None, offset=None):
+    """List the works in a collection.
+    Returns a dict with a 'collection' key, which again has a 'work-list'.
+
+    See `Browsing`_ for how to use `limit` and `offset`.
+    """
+    return _do_collection_query(collection, "works", limit, offset)


 # Submission methods
@@ -1219,11 +1322,17 @@ def submit_tags(**kwargs):
    Takes parameters named e.g. 'artist_tags', 'recording_tags', etc.,
    and of the form:
    {entity_id1: [tag1, ...], ...}
+    If you only have one tag for an entity you can use a string instead
+    of a list.

    The user's tags for each entity will be set to that list, adding or
    removing tags as necessary. Submitting an empty list for an entity
    will remove all tags for that entity by the user.
    """
+    for k, v in kwargs.items():
+        for id, tags in v.items():
+            kwargs[k][id] = tags if isinstance(tags, list) else [tags]
+
    query = mbxml.make_tag_request(**kwargs)
    return _do_mb_post("tag", query)

@@ -1,58 +0,0 @@
-Mutagen
-=======
-
-Mutagen is a Python module to handle audio metadata. It supports ASF, FLAC, 
-M4A, Monkey's Audio, MP3, Musepack, Ogg Opus, Ogg FLAC, Ogg Speex, Ogg 
-Theora, Ogg Vorbis, True Audio, WavPack, OptimFROG, and AIFF audio files. 
-All versions of ID3v2 are supported, and all standard ID3v2.4 frames are 
-parsed. It can read Xing headers to accurately calculate the bitrate and 
-length of MP3s. ID3 and APEv2 tags can be edited regardless of audio 
-format. It can also manipulate Ogg streams on an individual packet/page 
-level.
-
-Mutagen works on Python 2.6, 2.7, 3.3, 3.4 (CPython and PyPy) and has no 
-dependencies outside the Python standard library.
-
-
-Installing
----------
-
- $ ./setup.py build
- $ su -c "./setup.py install"
-
-
-Documentation
-------------
-
-The primary documentation for Mutagen is the doc strings found in
-the source code and the sphinx documentation in the docs/ directory.
-
-To build the docs (needs sphinx):
-
- $ ./setup.py build_sphinx
-
-The tools/ directory contains several useful examples.
-
-The docs are also hosted on readthedocs.org:
-
- http://mutagen.readthedocs.org
-
-
-Testing the Module
------------------
-
-To test Mutagen's MP3 reading support, run
- $ tools/mutagen-pony <your top-level MP3 directory here>
-Mutagen will try to load all of them, and report any errors.
-
-To look at the tags in files, run
- $ tools/mutagen-inspect filename ...
-
-To run our test suite,
- $ ./setup.py test
-
-
-Compatibility/Bugs
------------------
-
-See docs/bugs.rst
@@ -1,11 +1,10 @@
 # -*- coding: utf-8 -*-
-
 # Copyright (C) 2005  Michael Urman
 #
 # This program is free software; you can redistribute it and/or modify
-# it under the terms of version 2 of the GNU General Public License as
-# published by the Free Software Foundation.
-
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.

 """Mutagen aims to be an all purpose multimedia tagging library.

@@ -14,7 +13,7 @@
    import mutagen.[format]
    metadata = mutagen.[format].Open(filename)

-`metadata` acts like a dictionary of tags in the file. Tags are generally a
+``metadata`` acts like a dictionary of tags in the file. Tags are generally a
 list of string-like values, but may have additional methods available
 depending on tag or format. They may also be entirely different objects
 for certain keys, again depending on format.
@@ -22,9 +21,9 @@ for certain keys, again depending on format.

 from mutagen._util import MutagenError
 from mutagen._file import FileType, StreamInfo, File
-from mutagen._tags import Metadata
+from mutagen._tags import Tags, Metadata, PaddingInfo

-version = (1, 27)
+version = (1, 38, -1)
 """Version tuple."""

 version_string = ".".join(map(str, version))
@@ -38,4 +37,8 @@ StreamInfo

 File

+Tags
+
 Metadata
+
+PaddingInfo
@@ -1,10 +1,10 @@
 # -*- coding: utf-8 -*-
-
 # Copyright (C) 2013  Christoph Reiter
 #
 # This program is free software; you can redistribute it and/or modify
-# it under the terms of version 2 of the GNU General Public License as
-# published by the Free Software Foundation.
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.

 import sys

@@ -16,6 +16,7 @@ if PY2:
    from StringIO import StringIO
    BytesIO = StringIO
    from cStringIO import StringIO as cBytesIO
+    from itertools import izip

    long_ = long
    integer_types = (int, long)
@@ -57,6 +58,7 @@ elif PY3:
    string_types = (str,)
    text_type = str

+    izip = zip
    xrange = range
    cmp = lambda a, b: (a > b) - (a < b)
    chr_ = lambda x: bytes([x])
@@ -1,4 +1,9 @@
 # -*- coding: utf-8 -*-
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.

 """Constants used by Mutagen."""

@@ -1,21 +1,26 @@
+# -*- coding: utf-8 -*-
 # Copyright (C) 2005  Michael Urman
 #
 # This program is free software; you can redistribute it and/or modify
-# it under the terms of version 2 of the GNU General Public License as
-# published by the Free Software Foundation.
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.

 import warnings

-from mutagen._util import DictMixin
+from mutagen._util import DictMixin, loadfile
+from mutagen._compat import izip


 class FileType(DictMixin):
-    """An abstract object wrapping tags and audio stream information.
+    """FileType(filething, **kwargs)

-    Attributes:
+    Args:
+        filething (filething): A filename or a file-like object

-    * info -- stream information (length, bitrate, sample rate)
-    * tags -- metadata tags, if any
+    Subclasses might take further options via keyword arguments.
+
+    An abstract object wrapping tags and audio stream information.

    Each file format has different potential tags and stream
    information.
@@ -23,6 +28,10 @@ class FileType(DictMixin):
    FileTypes implement an interface very similar to Metadata; the
    dict interface, save, load, and delete calls on a FileType call
    the appropriate methods on its tag data.
+
+    Attributes:
+        info (`StreamInfo`): contains length, bitrate, sample rate
+        tags (`Tags`): metadata tags, if any, otherwise `None`
    """

    __module__ = "mutagen"
@@ -32,14 +41,15 @@ class FileType(DictMixin):
    filename = None
    _mimes = ["application/octet-stream"]

-    def __init__(self, filename=None, *args, **kwargs):
-        if filename is None:
+    def __init__(self, *args, **kwargs):
+        if not args and not kwargs:
            warnings.warn("FileType constructor requires a filename",
                          DeprecationWarning)
        else:
-            self.load(filename, *args, **kwargs)
+            self.load(*args, **kwargs)

-    def load(self, filename, *args, **kwargs):
+    @loadfile()
+    def load(self, filething, *args, **kwargs):
        raise NotImplementedError

    def __getitem__(self, key):
@@ -86,34 +96,47 @@ class FileType(DictMixin):
        else:
            return self.tags.keys()

-    def delete(self, filename=None):
-        """Remove tags from a file."""
+    @loadfile(writable=True)
+    def delete(self, filething):
+        """delete(filething=None)
+
+        Remove tags from a file.
+
+        In cases where the tagging format is independent of the file type
+        (for example `mutagen.id3.ID3`) all traces of the tagging format will
+        be removed.
+        In cases where the tag is part of the file type, all tags and
+        padding will be removed.
+
+        The tags attribute will be cleared as well if there is one.
+
+        Does nothing if the file has no tags.
+
+        Raises:
+            MutagenError: if deleting wasn't possible
+        """

        if self.tags is not None:
-            if filename is None:
-                filename = self.filename
-            else:
-                warnings.warn(
-                    "delete(filename=...) is deprecated, reload the file",
-                    DeprecationWarning)
-            return self.tags.delete(filename)
+            return self.tags.delete(filething)

-    def save(self, filename=None, **kwargs):
-        """Save metadata tags."""
+    @loadfile(writable=True)
+    def save(self, filething, **kwargs):
+        """save(filething=None, **kwargs)
+
+        Save metadata tags.
+
+        Raises:
+            MutagenError: if saving wasn't possible
+        """

-        if filename is None:
-            filename = self.filename
-        else:
-            warnings.warn(
-                "save(filename=...) is deprecated, reload the file",
-                DeprecationWarning)
        if self.tags is not None:
-            return self.tags.save(filename, **kwargs)
-        else:
-            raise ValueError("no tags in file")
+            return self.tags.save(filething, **kwargs)

    def pprint(self):
-        """Print stream information and comment key=value pairs."""
+        """
+        Returns:
+            text: stream information and comment key=value pairs.
+        """

        stream = "%s (%s)" % (self.info.pprint(), self.mime[0])
        try:
@@ -126,14 +149,15 @@ class FileType(DictMixin):
    def add_tags(self):
        """Adds new tags to the file.

-        Raises if tags already exist.
+        Raises:
+            MutagenError: if tags already exist or adding is not possible.
        """

        raise NotImplementedError

    @property
    def mime(self):
-        """A list of mime types"""
+        """A list of mime types (`text`)"""

        mimes = []
        for Kind in type(self).__mro__:
@@ -144,6 +168,20 @@ class FileType(DictMixin):

    @staticmethod
    def score(filename, fileobj, header):
+        """Returns a score for how likely the file can be parsed by this type.
+
+        Args:
+            filename (path): a file path
+            fileobj (fileobj): a file object open in rb mode. Position is
+                undefined
+            header (bytes): data of undefined length, starts with the start of
+                the file.
+
+        Returns:
+            int: negative if definitely not a matching type, otherwise a score,
+                the bigger the more certain that the file can be loaded.
+        """
+
        raise NotImplementedError


@@ -158,13 +196,19 @@ class StreamInfo(object):
    __module__ = "mutagen"

    def pprint(self):
-        """Print stream information"""
+        """
+        Returns:
+            text: Print stream information
+        """

        raise NotImplementedError


-def File(filename, options=None, easy=False):
-    """Guess the type of the file and try to open it.
+@loadfile(method=False)
+def File(filething, options=None, easy=False):
+    """File(filething, options=None, easy=False)
+
+    Guess the type of the file and try to open it.

    The file type is decided by several things, such as the first 128
    bytes (which usually contains a file type identifier), the
@@ -172,12 +216,20 @@ def File(filename, options=None, easy=False):

    If no appropriate type could be found, None is returned.

-    :param options: Sequence of :class:`FileType` implementations, defaults to
-                    all included ones.
+    Args:
+        filething (filething)
+        options: Sequence of :class:`FileType` implementations,
+            defaults to all included ones.
+        easy (bool):  If the easy wrappers should be returnd if available.
+            For example :class:`EasyMP3 <mp3.EasyMP3>` instead of
+            :class:`MP3 <mp3.MP3>`.

-    :param easy: If the easy wrappers should be returnd if available.
-                 For example :class:`EasyMP3 <mp3.EasyMP3>` instead
-                 of :class:`MP3 <mp3.MP3>`.
+    Returns:
+        FileType: A FileType instance for the detected type or `None` in case
+            the type couln't be determined.
+
+    Raises:
+        MutagenError: in case the detected type fails to load the file.
    """

    if options is None:
@@ -211,27 +263,37 @@ def File(filename, options=None, easy=False):
        from mutagen.optimfrog import OptimFROG
        from mutagen.aiff import AIFF
        from mutagen.aac import AAC
+        from mutagen.smf import SMF
+        from mutagen.dsf import DSF
        options = [MP3, TrueAudio, OggTheora, OggSpeex, OggVorbis, OggFLAC,
                   FLAC, AIFF, APEv2File, MP4, ID3FileType, WavPack,
-                   Musepack, MonkeysAudio, OptimFROG, ASF, OggOpus, AAC]
+                   Musepack, MonkeysAudio, OptimFROG, ASF, OggOpus, AAC,
+                   SMF, DSF]

    if not options:
        return None

-    fileobj = open(filename, "rb")
+    fileobj = filething.fileobj
+
    try:
        header = fileobj.read(128)
-        # Sort by name after score. Otherwise import order affects
-        # Kind sort order, which affects treatment of things with
-        # equals scores.
-        results = [(Kind.score(filename, fileobj, header), Kind.__name__)
-                   for Kind in options]
-    finally:
-        fileobj.close()
-    results = list(zip(results, options))
+    except IOError:
+        header = b""
+
+    # Sort by name after score. Otherwise import order affects
+    # Kind sort order, which affects treatment of things with
+    # equals scores.
+    results = [(Kind.score(filething.name, fileobj, header), Kind.__name__)
+               for Kind in options]
+
+    results = list(izip(results, options))
    results.sort()
    (score, name), Kind = results[-1]
    if score > 0:
-        return Kind(filename)
+        try:
+            fileobj.seek(0, 0)
+        except IOError:
+            pass
+        return Kind(fileobj, filename=filething.filename)
    else:
        return None
@@ -0,0 +1 @@
+Don't change things here, this is a copy of https://github.com/lazka/senf
@@ -0,0 +1,82 @@
+# -*- coding: utf-8 -*-
+# Copyright 2016 Christoph Reiter
+#
+# Permission is hereby granted, free of charge, to any person obtaining
+# a copy of this software and associated documentation files (the
+# "Software"), to deal in the Software without restriction, including
+# without limitation the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the Software, and to
+# permit persons to whom the Software is furnished to do so, subject to
+# the following conditions:
+#
+# The above copyright notice and this permission notice shall be
+# included in all copies or substantial portions of the Software.
+
+import os
+
+if os.name != "nt":
+    # make imports work
+    _winapi = object()
+
+from ._fsnative import fsnative, path2fsn, fsn2text, fsn2bytes, \
+    bytes2fsn, uri2fsn, fsn2uri, text2fsn
+from ._print import print_, input_
+from ._stdlib import sep, pathsep, curdir, pardir, altsep, extsep, devnull, \
+    defpath, getcwd, expanduser, expandvars
+from ._argv import argv
+from ._environ import environ, getenv, unsetenv, putenv
+from ._temp import mkstemp, gettempdir, gettempprefix, mkdtemp
+
+
+fsnative, print_, getcwd, getenv, unsetenv, putenv, environ, expandvars, \
+    path2fsn, fsn2text, fsn2bytes, bytes2fsn, uri2fsn, fsn2uri, mkstemp, \
+    gettempdir, gettempprefix, mkdtemp, input_, expanduser, text2fsn
+
+
+version = (1, 2, 2)
+"""Tuple[`int`, `int`, `int`]: The version tuple (major, minor, micro)"""
+
+
+version_string = ".".join(map(str, version))
+"""`str`: A version string"""
+
+
+argv = argv
+"""List[`fsnative`]: Like `sys.argv` but contains unicode under
+Windows + Python 2
+"""
+
+
+sep = sep
+"""`fsnative`: Like `os.sep` but a `fsnative`"""
+
+
+pathsep = pathsep
+"""`fsnative`: Like `os.pathsep` but a `fsnative`"""
+
+
+curdir = curdir
+"""`fsnative`: Like `os.curdir` but a `fsnative`"""
+
+
+pardir = pardir
+"""`fsnative`: Like `os.pardir` but a fsnative"""
+
+
+altsep = altsep
+"""`fsnative` or `None`: Like `os.altsep` but a `fsnative` or `None`"""
+
+
+extsep = extsep
+"""`fsnative`: Like `os.extsep` but a `fsnative`"""
+
+
+devnull = devnull
+"""`fsnative`: Like `os.devnull` but a `fsnative`"""
+
+
+defpath = defpath
+"""`fsnative`: Like `os.defpath` but a `fsnative`"""
+
+
+__all__ = []
@@ -0,0 +1,109 @@
+# -*- coding: utf-8 -*-
+# Copyright 2016 Christoph Reiter
+#
+# Permission is hereby granted, free of charge, to any person obtaining
+# a copy of this software and associated documentation files (the
+# "Software"), to deal in the Software without restriction, including
+# without limitation the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the Software, and to
+# permit persons to whom the Software is furnished to do so, subject to
+# the following conditions:
+#
+# The above copyright notice and this permission notice shall be
+# included in all copies or substantial portions of the Software.
+
+import sys
+import ctypes
+import collections
+from functools import total_ordering
+
+from ._compat import PY2, string_types
+from ._fsnative import is_win, _fsn2legacy, path2fsn
+from . import _winapi as winapi
+
+
+def _get_win_argv():
+    """Returns a unicode argv under Windows and standard sys.argv otherwise
+
+    Returns:
+        List[`fsnative`]
+    """
+
+    assert is_win
+
+    argc = ctypes.c_int()
+    try:
+        argv = winapi.CommandLineToArgvW(
+            winapi.GetCommandLineW(), ctypes.byref(argc))
+    except WindowsError:
+        return []
+
+    if not argv:
+        return []
+
+    res = argv[max(0, argc.value - len(sys.argv)):argc.value]
+
+    winapi.LocalFree(argv)
+
+    return res
+
+
+@total_ordering
+class Argv(collections.MutableSequence):
+    """List[`fsnative`]: Like `sys.argv` but contains unicode
+    keys and values under Windows + Python 2.
+
+    Any changes made will be forwarded to `sys.argv`.
+    """
+
+    def __init__(self):
+        if PY2 and is_win:
+            self._argv = _get_win_argv()
+        else:
+            self._argv = sys.argv
+
+    def __getitem__(self, index):
+        return self._argv[index]
+
+    def __setitem__(self, index, value):
+        if isinstance(value, string_types):
+            value = path2fsn(value)
+
+        self._argv[index] = value
+
+        if sys.argv is not self._argv:
+            try:
+                if isinstance(value, string_types):
+                    sys.argv[index] = _fsn2legacy(value)
+                else:
+                    sys.argv[index] = [_fsn2legacy(path2fsn(v)) for v in value]
+            except IndexError:
+                pass
+
+    def __delitem__(self, index):
+        del self._argv[index]
+        try:
+            del sys.argv[index]
+        except IndexError:
+            pass
+
+    def __eq__(self, other):
+        return self._argv == other
+
+    def __lt__(self, other):
+        return self._argv < other
+
+    def __len__(self):
+        return len(self._argv)
+
+    def __repr__(self):
+        return repr(self._argv)
+
+    def insert(self, index, value):
+        value = path2fsn(value)
+        self._argv.insert(index, value)
+        if sys.argv is not self._argv:
+            sys.argv.insert(index, _fsn2legacy(value))
+
+
+argv = Argv()
@@ -0,0 +1,52 @@
+# -*- coding: utf-8 -*-
+# Copyright 2016 Christoph Reiter
+#
+# Permission is hereby granted, free of charge, to any person obtaining
+# a copy of this software and associated documentation files (the
+# "Software"), to deal in the Software without restriction, including
+# without limitation the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the Software, and to
+# permit persons to whom the Software is furnished to do so, subject to
+# the following conditions:
+#
+# The above copyright notice and this permission notice shall be
+# included in all copies or substantial portions of the Software.
+
+import sys
+
+
+PY2 = sys.version_info[0] == 2
+PY3 = not PY2
+
+
+if PY2:
+    from urlparse import urlparse, urlunparse
+    urlparse, urlunparse
+    from urllib import pathname2url, url2pathname, quote, unquote
+    pathname2url, url2pathname, quote, unquote
+
+    from StringIO import StringIO
+    BytesIO = StringIO
+    from io import StringIO as TextIO
+    TextIO
+
+    string_types = (str, unicode)
+    text_type = unicode
+
+    iteritems = lambda d: d.iteritems()
+elif PY3:
+    from urllib.parse import urlparse, quote, unquote, urlunparse
+    urlparse, quote, unquote, urlunparse
+    from urllib.request import pathname2url, url2pathname
+    pathname2url, url2pathname
+
+    from io import StringIO
+    StringIO = StringIO
+    TextIO = StringIO
+    from io import BytesIO
+    BytesIO = BytesIO
+
+    string_types = (str,)
+    text_type = str
+
+    iteritems = lambda d: iter(d.items())
@@ -0,0 +1,259 @@
+# -*- coding: utf-8 -*-
+# Copyright 2016 Christoph Reiter
+#
+# Permission is hereby granted, free of charge, to any person obtaining
+# a copy of this software and associated documentation files (the
+# "Software"), to deal in the Software without restriction, including
+# without limitation the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the Software, and to
+# permit persons to whom the Software is furnished to do so, subject to
+# the following conditions:
+#
+# The above copyright notice and this permission notice shall be
+# included in all copies or substantial portions of the Software.
+
+import os
+import ctypes
+import collections
+
+from ._compat import text_type, PY2
+from ._fsnative import path2fsn, is_win, _fsn2legacy, fsnative
+from . import _winapi as winapi
+
+
+def get_windows_env_var(key):
+    """Get an env var.
+
+    Raises:
+        WindowsError
+    """
+
+    if not isinstance(key, text_type):
+        raise TypeError("%r not of type %r" % (key, text_type))
+
+    buf = ctypes.create_unicode_buffer(32767)
+
+    stored = winapi.GetEnvironmentVariableW(key, buf, 32767)
+    if stored == 0:
+        raise ctypes.WinError()
+    return buf[:stored]
+
+
+def set_windows_env_var(key, value):
+    """Set an env var.
+
+    Raises:
+        WindowsError
+    """
+
+    if not isinstance(key, text_type):
+        raise TypeError("%r not of type %r" % (key, text_type))
+
+    if not isinstance(value, text_type):
+        raise TypeError("%r not of type %r" % (value, text_type))
+
+    status = winapi.SetEnvironmentVariableW(key, value)
+    if status == 0:
+        raise ctypes.WinError()
+
+
+def del_windows_env_var(key):
+    """Delete an env var.
+
+    Raises:
+        WindowsError
+    """
+
+    if not isinstance(key, text_type):
+        raise TypeError("%r not of type %r" % (key, text_type))
+
+    status = winapi.SetEnvironmentVariableW(key, None)
+    if status == 0:
+        raise ctypes.WinError()
+
+
+def read_windows_environ():
+    """Returns a unicode dict of the Windows environment.
+
+    Raises:
+        WindowsEnvironError
+    """
+
+    res = winapi.GetEnvironmentStringsW()
+    if not res:
+        raise ctypes.WinError()
+
+    res = ctypes.cast(res, ctypes.POINTER(ctypes.c_wchar))
+
+    done = []
+    current = u""
+    i = 0
+    while 1:
+        c = res[i]
+        i += 1
+        if c == u"\x00":
+            if not current:
+                break
+            done.append(current)
+            current = u""
+            continue
+        current += c
+
+    dict_ = {}
+    for entry in done:
+        try:
+            key, value = entry.split(u"=", 1)
+        except ValueError:
+            continue
+        key = _norm_key(key)
+        dict_[key] = value
+
+    status = winapi.FreeEnvironmentStringsW(res)
+    if status == 0:
+        raise ctypes.WinError()
+
+    return dict_
+
+
+def _norm_key(key):
+    assert isinstance(key, fsnative)
+    if is_win:
+        key = key.upper()
+    return key
+
+
+class Environ(collections.MutableMapping):
+    """Dict[`fsnative`, `fsnative`]: Like `os.environ` but contains unicode
+    keys and values under Windows + Python 2.
+
+    Any changes made will be forwarded to `os.environ`.
+    """
+
+    def __init__(self):
+        if is_win and PY2:
+            try:
+                env = read_windows_environ()
+            except WindowsError:
+                env = {}
+        else:
+            env = os.environ
+        self._env = env
+
+    def __getitem__(self, key):
+        key = _norm_key(path2fsn(key))
+        return self._env[key]
+
+    def __setitem__(self, key, value):
+        key = _norm_key(path2fsn(key))
+        value = path2fsn(value)
+
+        if is_win and PY2:
+            # this calls putenv, so do it first and replace later
+            try:
+                os.environ[_fsn2legacy(key)] = _fsn2legacy(value)
+            except OSError:
+                raise ValueError
+
+            try:
+                set_windows_env_var(key, value)
+            except WindowsError:
+                # py3+win fails for invalid keys. try to do the same
+                raise ValueError
+        try:
+            self._env[key] = value
+        except OSError:
+            raise ValueError
+
+    def __delitem__(self, key):
+        key = _norm_key(path2fsn(key))
+
+        if is_win and PY2:
+            try:
+                del_windows_env_var(key)
+            except WindowsError:
+                pass
+
+            try:
+                del os.environ[_fsn2legacy(key)]
+            except KeyError:
+                pass
+
+        del self._env[key]
+
+    def __iter__(self):
+        return iter(self._env)
+
+    def __len__(self):
+        return len(self._env)
+
+    def __repr__(self):
+        return repr(self._env)
+
+    def copy(self):
+        return self._env.copy()
+
+
+environ = Environ()
+
+
+def getenv(key, value=None):
+    """Like `os.getenv` but returns unicode under Windows + Python 2
+
+    Args:
+        key (pathlike): The env var to get
+        value (object): The value to return if the env var does not exist
+    Returns:
+        `fsnative` or `object`:
+            The env var or the passed value if it doesn't exist
+    """
+
+    key = path2fsn(key)
+    if is_win and PY2:
+        return environ.get(key, value)
+    return os.getenv(key, value)
+
+
+def unsetenv(key):
+    """Like `os.unsetenv` but takes unicode under Windows + Python 2
+
+    Args:
+        key (pathlike): The env var to unset
+    """
+
+    key = path2fsn(key)
+    if is_win:
+        # python 3 has no unsetenv under Windows -> use our ctypes one as well
+        try:
+            del_windows_env_var(key)
+        except WindowsError:
+            pass
+    else:
+        os.unsetenv(key)
+
+
+def putenv(key, value):
+    """Like `os.putenv` but takes unicode under Windows + Python 2
+
+    Args:
+        key (pathlike): The env var to get
+        value (pathlike): The value to set
+    Raises:
+        ValueError
+    """
+
+    key = path2fsn(key)
+    value = path2fsn(value)
+
+    if is_win and PY2:
+        try:
+            set_windows_env_var(key, value)
+        except WindowsError:
+            # py3 + win fails here
+            raise ValueError
+    else:
+        try:
+            os.putenv(key, value)
+        except OSError:
+            # win + py3 raise here for invalid keys which is probably a bug.
+            # ValueError seems better
+            raise ValueError
@@ -0,0 +1,610 @@
+# -*- coding: utf-8 -*-
+# Copyright 2016 Christoph Reiter
+#
+# Permission is hereby granted, free of charge, to any person obtaining
+# a copy of this software and associated documentation files (the
+# "Software"), to deal in the Software without restriction, including
+# without limitation the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the Software, and to
+# permit persons to whom the Software is furnished to do so, subject to
+# the following conditions:
+#
+# The above copyright notice and this permission notice shall be
+# included in all copies or substantial portions of the Software.
+
+import os
+import sys
+import ctypes
+import codecs
+
+from . import _winapi as winapi
+from ._compat import text_type, PY3, PY2, url2pathname, urlparse, quote, \
+    unquote, urlunparse
+
+
+is_win = os.name == "nt"
+is_unix = not is_win
+is_darwin = sys.platform == "darwin"
+
+_surrogatepass = "strict" if PY2 else "surrogatepass"
+
+
+def _normalize_codec(codec, _cache={}):
+    """Raises LookupError"""
+
+    try:
+        return _cache[codec]
+    except KeyError:
+        _cache[codec] = codecs.lookup(codec).name
+        return _cache[codec]
+
+
+def _swap_bytes(data):
+    """swaps bytes for 16 bit, leaves remaining trailing bytes alone"""
+
+    a, b = data[1::2], data[::2]
+    data = bytearray().join(bytearray(x) for x in zip(a, b))
+    if len(b) > len(a):
+        data += b[-1:]
+    return bytes(data)
+
+
+def _codec_fails_on_encode_surrogates(codec, _cache={}):
+    """Returns if a codec fails correctly when passing in surrogates with
+    a surrogatepass/surrogateescape error handler. Some codecs were broken
+    in Python <3.4
+    """
+
+    try:
+        return _cache[codec]
+    except KeyError:
+        try:
+            u"\uD800\uDC01".encode(codec)
+        except UnicodeEncodeError:
+            _cache[codec] = True
+        else:
+            _cache[codec] = False
+        return _cache[codec]
+
+
+def _codec_can_decode_with_surrogatepass(codec, _cache={}):
+    """Returns if a codec supports the surrogatepass error handler when
+    decoding. Some codecs were broken in Python <3.4
+    """
+
+    try:
+        return _cache[codec]
+    except KeyError:
+        try:
+            u"\ud83d".encode(
+                codec, _surrogatepass).decode(codec, _surrogatepass)
+        except UnicodeDecodeError:
+            _cache[codec] = False
+        else:
+            _cache[codec] = True
+        return _cache[codec]
+
+
+def _bytes2winpath(data, codec):
+    """Like data.decode(codec, 'surrogatepass') but makes utf-16-le/be work
+    on Python < 3.4 + Windows
+
+    https://bugs.python.org/issue27971
+
+    Raises UnicodeDecodeError, LookupError
+    """
+
+    try:
+        return data.decode(codec, _surrogatepass)
+    except UnicodeDecodeError:
+        if not _codec_can_decode_with_surrogatepass(codec):
+            if _normalize_codec(codec) == "utf-16-be":
+                data = _swap_bytes(data)
+                codec = "utf-16-le"
+            if _normalize_codec(codec) == "utf-16-le":
+                buffer_ = ctypes.create_string_buffer(data + b"\x00\x00")
+                value = ctypes.wstring_at(buffer_, len(data) // 2)
+                if value.encode("utf-16-le", _surrogatepass) != data:
+                    raise
+                return value
+            else:
+                raise
+        else:
+            raise
+
+
+def _winpath2bytes_py3(text, codec):
+    """Fallback implementation for text including surrogates"""
+
+    # merge surrogate codepoints
+    if _normalize_codec(codec).startswith("utf-16"):
+        # fast path, utf-16 merges anyway
+        return text.encode(codec, _surrogatepass)
+    return _bytes2winpath(
+        text.encode("utf-16-le", _surrogatepass),
+        "utf-16-le").encode(codec, _surrogatepass)
+
+
+if PY2:
+    def _winpath2bytes(text, codec):
+        return text.encode(codec)
+else:
+    def _winpath2bytes(text, codec):
+        if _codec_fails_on_encode_surrogates(codec):
+            try:
+                return text.encode(codec)
+            except UnicodeEncodeError:
+                return _winpath2bytes_py3(text, codec)
+        else:
+            return _winpath2bytes_py3(text, codec)
+
+
+def _fsn2legacy(path):
+    """Takes a fsnative path and returns a path that can be put into os.environ
+    or sys.argv. Might result in a mangled path on Python2 + Windows.
+    Can't fail.
+
+    Args:
+        path (fsnative)
+    Returns:
+        str
+    """
+
+    if PY2 and is_win:
+        return path.encode(_encoding, "replace")
+    return path
+
+
+def _fsnative(text):
+    if not isinstance(text, text_type):
+        raise TypeError("%r needs to be a text type (%r)" % (text, text_type))
+
+    if is_unix:
+        # First we go to bytes so we can be sure we have a valid source.
+        # Theoretically we should fail here in case we have a non-unicode
+        # encoding. But this would make everything complicated and there is
+        # no good way to handle a failure from the user side. Instead
+        # fall back to utf-8 which is the most likely the right choice in
+        # a mis-configured environment
+        encoding = _encoding
+        try:
+            path = text.encode(encoding, _surrogatepass)
+        except UnicodeEncodeError:
+            path = text.encode("utf-8", _surrogatepass)
+
+        if b"\x00" in path:
+            path = path.replace(b"\x00", fsn2bytes(_fsnative(u"\uFFFD"), None))
+
+        if PY3:
+            return path.decode(_encoding, "surrogateescape")
+        return path
+    else:
+        if u"\x00" in text:
+            text = text.replace(u"\x00", u"\uFFFD")
+        return text
+
+
+def _create_fsnative(type_):
+    # a bit of magic to make fsnative(u"foo") and isinstance(path, fsnative)
+    # work
+
+    class meta(type):
+
+        def __instancecheck__(self, instance):
+            return _typecheck_fsnative(instance)
+
+        def __subclasscheck__(self, subclass):
+            return issubclass(subclass, type_)
+
+    class impl(object):
+        """fsnative(text=u"")
+
+        Args:
+            text (text): The text to convert to a path
+        Returns:
+            fsnative: The new path.
+        Raises:
+            TypeError: In case something other then `text` has been passed
+
+        This type is a virtual base class for the real path type.
+        Instantiating it returns an instance of the real path type and it
+        overrides instance and subclass checks so that `isinstance` and
+        `issubclass` checks work:
+
+        ::
+
+            isinstance(fsnative(u"foo"), fsnative) == True
+            issubclass(type(fsnative(u"foo")), fsnative) == True
+
+        The real returned type is:
+
+        - **Python 2 + Windows:** :obj:`python:unicode`, with ``surrogates``,
+          without ``null``
+        - **Python 2 + Unix:** :obj:`python:str`, without ``null``
+        - **Python 3 + Windows:** :obj:`python3:str`, with ``surrogates``,
+          without ``null``
+        - **Python 3 + Unix:** :obj:`python3:str`, with ``surrogates``, without
+          ``null``, without code points not encodable with the locale encoding
+
+        Constructing a `fsnative` can't fail.
+
+        Passing a `fsnative` to :func:`open` will never lead to `ValueError`
+        or `TypeError`.
+
+        Any operation on `fsnative` can also use the `str` type, as long as
+        the `str` only contains ASCII and no NULL.
+        """
+
+        def __new__(cls, text=u""):
+            return _fsnative(text)
+
+    new_type = meta("fsnative", (object,), dict(impl.__dict__))
+    new_type.__module__ = "senf"
+    return new_type
+
+
+fsnative_type = text_type if is_win or PY3 else bytes
+fsnative = _create_fsnative(fsnative_type)
+
+
+def _typecheck_fsnative(path):
+    """
+    Args:
+        path (object)
+    Returns:
+        bool: if path is a fsnative
+    """
+
+    if not isinstance(path, fsnative_type):
+        return False
+
+    if PY3 or is_win:
+        if u"\x00" in path:
+            return False
+
+        if is_unix and not _is_unicode_encoding:
+            try:
+                path.encode(_encoding, "surrogateescape")
+            except UnicodeEncodeError:
+                return False
+    elif b"\x00" in path:
+        return False
+
+    return True
+
+
+def _fsn2native(path):
+    """
+    Args:
+        path (fsnative)
+    Returns:
+        `text` on Windows, `bytes` on Unix
+    Raises:
+        TypeError: in case the type is wrong or the ´str` on Py3 + Unix
+            can't be converted to `bytes`
+
+    This helper allows to validate the type and content of a path.
+    To reduce overhead the encoded value for Py3 + Unix is returned so
+    it can be reused.
+    """
+
+    if not isinstance(path, fsnative_type):
+        raise TypeError("path needs to be %s, not %s" % (
+            fsnative_type.__name__, type(path).__name__))
+
+    if is_unix:
+        if PY3:
+            try:
+                path = path.encode(_encoding, "surrogateescape")
+            except UnicodeEncodeError:
+                assert not _is_unicode_encoding
+                # This look more like ValueError, but raising only one error
+                # makes things simpler... also one could say str + surrogates
+                # is its own type
+                raise TypeError(
+                    "path contained Unicode code points not valid in"
+                    "the current path encoding. To create a valid "
+                    "path from Unicode use text2fsn()")
+
+        if b"\x00" in path:
+            raise TypeError("fsnative can't contain nulls")
+    else:
+        if u"\x00" in path:
+            raise TypeError("fsnative can't contain nulls")
+
+    return path
+
+
+def _get_encoding():
+    """The encoding used for paths, argv, environ, stdout and stdin"""
+
+    encoding = sys.getfilesystemencoding()
+    if encoding is None:
+        if is_darwin:
+            encoding = "utf-8"
+        elif is_win:
+            encoding = "mbcs"
+        else:
+            encoding = "ascii"
+    encoding = _normalize_codec(encoding)
+    return encoding
+
+
+_encoding = _get_encoding()
+_is_unicode_encoding = _encoding.startswith("utf")
+
+
+def path2fsn(path):
+    """
+    Args:
+        path (pathlike): The path to convert
+    Returns:
+        `fsnative`
+    Raises:
+        TypeError: In case the type can't be converted to a `fsnative`
+        ValueError: In case conversion fails
+
+    Returns a `fsnative` path for a `pathlike`.
+    """
+
+    # allow mbcs str on py2+win and bytes on py3
+    if PY2:
+        if is_win:
+            if isinstance(path, bytes):
+                path = path.decode(_encoding)
+        else:
+            if isinstance(path, text_type):
+                path = path.encode(_encoding)
+        if "\x00" in path:
+            raise ValueError("embedded null")
+    else:
+        path = getattr(os, "fspath", lambda x: x)(path)
+        if isinstance(path, bytes):
+            if b"\x00" in path:
+                raise ValueError("embedded null")
+            path = path.decode(_encoding, "surrogateescape")
+        elif is_unix and isinstance(path, str):
+            # make sure we can encode it and this is not just some random
+            # unicode string
+            data = path.encode(_encoding, "surrogateescape")
+            if b"\x00" in data:
+                raise ValueError("embedded null")
+        else:
+            if u"\x00" in path:
+                raise ValueError("embedded null")
+
+    if not isinstance(path, fsnative_type):
+        raise TypeError("path needs to be %s", fsnative_type.__name__)
+
+    return path
+
+
+def fsn2text(path, strict=False):
+    """
+    Args:
+        path (fsnative): The path to convert
+        strict (bool): Fail in case the conversion is not reversible
+    Returns:
+        `text`
+    Raises:
+        TypeError: In case no `fsnative` has been passed
+        ValueError: In case ``strict`` was True and the conversion failed
+
+    Converts a `fsnative` path to `text`.
+
+    Can be used to pass a path to some unicode API, like for example a GUI
+    toolkit.
+
+    If ``strict`` is True the conversion will fail in case it is not
+    reversible. This can be useful for converting program arguments that are
+    supposed to be text and erroring out in case they are not.
+
+    Encoding with a Unicode encoding will always succeed with the result.
+    """
+
+    path = _fsn2native(path)
+
+    errors = "strict" if strict else "replace"
+
+    if is_win:
+        return path.encode("utf-16-le", _surrogatepass).decode("utf-16-le",
+                                                               errors)
+    else:
+        return path.decode(_encoding, errors)
+
+
+def text2fsn(text):
+    """
+    Args:
+        text (text): The text to convert
+    Returns:
+        `fsnative`
+    Raises:
+        TypeError: In case no `text` has been passed
+
+    Takes `text` and converts it to a `fsnative`.
+
+    This operation is not reversible and can't fail.
+    """
+
+    return fsnative(text)
+
+
+def fsn2bytes(path, encoding):
+    """
+    Args:
+        path (fsnative): The path to convert
+        encoding (`str` or `None`): `None` if you don't care about Windows
+    Returns:
+        `bytes`
+    Raises:
+        TypeError: If no `fsnative` path is passed
+        ValueError: If encoding fails or no encoding is given
+
+    Converts a `fsnative` path to `bytes`.
+
+    The passed *encoding* is only used on platforms where paths are not
+    associated with an encoding (Windows for example). If you don't care about
+    Windows you can pass `None`.
+
+    For Windows paths, lone surrogates will be encoded like normal code points
+    and surrogate pairs will be merged before encoding. In case of ``utf-8``
+    or ``utf-16-le`` this is equal to the `WTF-8 and WTF-16 encoding
+    <https://simonsapin.github.io/wtf-8/>`__.
+    """
+
+    path = _fsn2native(path)
+
+    if is_win:
+        if encoding is None:
+            raise ValueError("invalid encoding %r" % encoding)
+
+        try:
+            return _winpath2bytes(path, encoding)
+        except LookupError:
+            raise ValueError("invalid encoding %r" % encoding)
+    else:
+        return path
+
+
+def bytes2fsn(data, encoding):
+    """
+    Args:
+        data (bytes): The data to convert
+        encoding (`str` or `None`): `None` if you don't care about Windows
+    Returns:
+        `fsnative`
+    Raises:
+        TypeError: If no `bytes` path is passed
+        ValueError: If decoding fails or no encoding is given
+
+    Turns `bytes` to a `fsnative` path.
+
+    The passed *encoding* is only used on platforms where paths are not
+    associated with an encoding (Windows for example). If you don't care about
+    Windows you can pass `None`.
+    """
+
+    if not isinstance(data, bytes):
+        raise TypeError("data needs to be bytes")
+
+    if is_win:
+        if encoding is None:
+            raise ValueError("invalid encoding %r" % encoding)
+        try:
+            path = _bytes2winpath(data, encoding)
+        except LookupError:
+            raise ValueError("invalid encoding %r" % encoding)
+        if u"\x00" in path:
+            raise ValueError("contains nulls")
+        return path
+    else:
+        if b"\x00" in data:
+            raise ValueError("contains nulls")
+        if PY2:
+            return data
+        else:
+            return data.decode(_encoding, "surrogateescape")
+
+
+def uri2fsn(uri):
+    """
+    Args:
+        uri (`text` or :obj:`python:str`): A file URI
+    Returns:
+        `fsnative`
+    Raises:
+        TypeError: In case an invalid type is passed
+        ValueError: In case the URI isn't a valid file URI
+
+    Takes a file URI and returns a `fsnative` path
+    """
+
+    if PY2:
+        if isinstance(uri, text_type):
+            uri = uri.encode("utf-8")
+        if not isinstance(uri, bytes):
+            raise TypeError("uri needs to be ascii str or unicode")
+    else:
+        if not isinstance(uri, str):
+            raise TypeError("uri needs to be str")
+
+    parsed = urlparse(uri)
+    scheme = parsed.scheme
+    netloc = parsed.netloc
+    path = parsed.path
+
+    if scheme != "file":
+        raise ValueError("Not a file URI: %r" % uri)
+
+    if not path:
+        raise ValueError("Invalid file URI: %r" % uri)
+
+    uri = urlunparse(parsed)[7:]
+
+    if is_win:
+        path = url2pathname(uri)
+        if netloc:
+            path = "\\\\" + path
+        if PY2:
+            path = path.decode("utf-8")
+        if u"\x00" in path:
+            raise ValueError("embedded null")
+        return path
+    else:
+        path = url2pathname(uri)
+        if "\x00" in path:
+            raise ValueError("embedded null")
+        if PY3:
+            path = fsnative(path)
+        return path
+
+
+def fsn2uri(path):
+    """
+    Args:
+        path (fsnative): The path to convert to an URI
+    Returns:
+        `text`: An ASCII only URI
+    Raises:
+        TypeError: If no `fsnative` was passed
+        ValueError: If the path can't be converted
+
+    Takes a `fsnative` path and returns a file URI.
+
+    On Windows non-ASCII characters will be encoded using utf-8 and then
+    percent encoded.
+    """
+
+    path = _fsn2native(path)
+
+    def _quote_path(path):
+        # RFC 2396
+        path = quote(path, "/:@&=+$,")
+        if PY2:
+            path = path.decode("ascii")
+        return path
+
+    if is_win:
+        buf = ctypes.create_unicode_buffer(winapi.INTERNET_MAX_URL_LENGTH)
+        length = winapi.DWORD(winapi.INTERNET_MAX_URL_LENGTH)
+        flags = 0
+        try:
+            winapi.UrlCreateFromPathW(path, buf, ctypes.byref(length), flags)
+        except WindowsError as e:
+            raise ValueError(e)
+        uri = buf[:length.value]
+
+        # For some reason UrlCreateFromPathW escapes some chars outside of
+        # ASCII and some not. Unquote and re-quote with utf-8.
+        if PY3:
+            # latin-1 maps code points directly to bytes, which is what we want
+            uri = unquote(uri, "latin-1")
+        else:
+            # Python 2 does what we want by default
+            uri = unquote(uri)
+
+        return _quote_path(uri.encode("utf-8", _surrogatepass))
+
+    else:
+        return u"file://" + _quote_path(path)
@@ -0,0 +1,353 @@
+# -*- coding: utf-8 -*-
+# Copyright 2016 Christoph Reiter
+#
+# Permission is hereby granted, free of charge, to any person obtaining
+# a copy of this software and associated documentation files (the
+# "Software"), to deal in the Software without restriction, including
+# without limitation the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the Software, and to
+# permit persons to whom the Software is furnished to do so, subject to
+# the following conditions:
+#
+# The above copyright notice and this permission notice shall be
+# included in all copies or substantial portions of the Software.
+
+import sys
+import os
+import ctypes
+
+from ._fsnative import _encoding, is_win, is_unix, _surrogatepass
+from ._compat import text_type, PY2, PY3
+from ._winansi import AnsiState, ansi_split
+from . import _winapi as winapi
+
+
+def print_(*objects, **kwargs):
+    """print_(*objects, sep=None, end=None, file=None, flush=False)
+
+    Args:
+        objects (object): zero or more objects to print
+        sep (str): Object separator to use, defaults to ``" "``
+        end (str): Trailing string to use, defaults to ``"\\n"``.
+            If end is ``"\\n"`` then `os.linesep` is used.
+        file (object): A file-like object, defaults to `sys.stdout`
+        flush (bool): If the file stream should be flushed
+    Raises:
+        EnvironmentError
+
+    Like print(), but:
+
+    * Supports printing filenames under Unix + Python 3 and Windows + Python 2
+    * Emulates ANSI escape sequence support under Windows
+    * Never fails due to encoding/decoding errors. Tries hard to get everything
+      on screen as is, but will fall back to "?" if all fails.
+
+    This does not conflict with ``colorama``, but will not use it on Windows.
+    """
+
+    sep = kwargs.get("sep")
+    sep = sep if sep is not None else " "
+    end = kwargs.get("end")
+    end = end if end is not None else "\n"
+    file = kwargs.get("file")
+    file = file if file is not None else sys.stdout
+    flush = bool(kwargs.get("flush", False))
+
+    if is_win:
+        _print_windows(objects, sep, end, file, flush)
+    else:
+        _print_unix(objects, sep, end, file, flush)
+
+
+def _print_unix(objects, sep, end, file, flush):
+    """A print_() implementation which writes bytes"""
+
+    encoding = _encoding
+
+    if isinstance(sep, text_type):
+        sep = sep.encode(encoding, "replace")
+    if not isinstance(sep, bytes):
+        raise TypeError
+
+    if isinstance(end, text_type):
+        end = end.encode(encoding, "replace")
+    if not isinstance(end, bytes):
+        raise TypeError
+
+    if end == b"\n":
+        end = os.linesep
+        if PY3:
+            end = end.encode("ascii")
+
+    parts = []
+    for obj in objects:
+        if not isinstance(obj, text_type) and not isinstance(obj, bytes):
+            obj = text_type(obj)
+        if isinstance(obj, text_type):
+            if PY2:
+                obj = obj.encode(encoding, "replace")
+            else:
+                try:
+                    obj = obj.encode(encoding, "surrogateescape")
+                except UnicodeEncodeError:
+                    obj = obj.encode(encoding, "replace")
+        assert isinstance(obj, bytes)
+        parts.append(obj)
+
+    data = sep.join(parts) + end
+    assert isinstance(data, bytes)
+
+    file = getattr(file, "buffer", file)
+
+    try:
+        file.write(data)
+    except TypeError:
+        if PY3:
+            # For StringIO, first try with surrogates
+            surr_data = data.decode(encoding, "surrogateescape")
+            try:
+                file.write(surr_data)
+            except (TypeError, ValueError):
+                file.write(data.decode(encoding, "replace"))
+        else:
+            # for file like objects with don't support bytes
+            file.write(data.decode(encoding, "replace"))
+
+    if flush:
+        file.flush()
+
+
+ansi_state = AnsiState()
+
+
+def _print_windows(objects, sep, end, file, flush):
+    """The windows implementation of print_()"""
+
+    h = winapi.INVALID_HANDLE_VALUE
+
+    try:
+        fileno = file.fileno()
+    except (EnvironmentError, AttributeError):
+        pass
+    else:
+        if fileno == 1:
+            h = winapi.GetStdHandle(winapi.STD_OUTPUT_HANDLE)
+        elif fileno == 2:
+            h = winapi.GetStdHandle(winapi.STD_ERROR_HANDLE)
+
+    encoding = _encoding
+
+    parts = []
+    for obj in objects:
+        if isinstance(obj, bytes):
+            obj = obj.decode(encoding, "replace")
+        if not isinstance(obj, text_type):
+            obj = text_type(obj)
+        parts.append(obj)
+
+    if isinstance(sep, bytes):
+        sep = sep.decode(encoding, "replace")
+    if not isinstance(sep, text_type):
+        raise TypeError
+
+    if isinstance(end, bytes):
+        end = end.decode(encoding, "replace")
+    if not isinstance(end, text_type):
+        raise TypeError
+
+    if end == u"\n":
+        end = os.linesep
+
+    text = sep.join(parts) + end
+    assert isinstance(text, text_type)
+
+    is_console = True
+    if h == winapi.INVALID_HANDLE_VALUE:
+        is_console = False
+    else:
+        # get the default value
+        info = winapi.CONSOLE_SCREEN_BUFFER_INFO()
+        if not winapi.GetConsoleScreenBufferInfo(h, ctypes.byref(info)):
+            is_console = False
+
+    if is_console:
+        # make sure we flush before we apply any console attributes
+        file.flush()
+
+        # try to force a utf-8 code page, use the output CP if that fails
+        cp = winapi.GetConsoleOutputCP()
+        try:
+            encoding = "utf-8"
+            if winapi.SetConsoleOutputCP(65001) == 0:
+                encoding = None
+
+            for is_ansi, part in ansi_split(text):
+                if is_ansi:
+                    ansi_state.apply(h, part)
+                else:
+                    if encoding is not None:
+                        data = part.encode(encoding, _surrogatepass)
+                    else:
+                        data = _encode_codepage(cp, part)
+                    os.write(fileno, data)
+        finally:
+            # reset the code page to what we had before
+            winapi.SetConsoleOutputCP(cp)
+    else:
+        # try writing bytes first, so in case of Python 2 StringIO we get
+        # the same type on all platforms
+        try:
+            file.write(text.encode("utf-8", _surrogatepass))
+        except (TypeError, ValueError):
+            file.write(text)
+
+        if flush:
+            file.flush()
+
+
+def _readline_windows():
+    """Raises OSError"""
+
+    try:
+        fileno = sys.stdin.fileno()
+    except (EnvironmentError, AttributeError):
+        fileno = -1
+
+    # In case stdin is replaced, read from that
+    if fileno != 0:
+        return _readline_windows_fallback()
+
+    h = winapi.GetStdHandle(winapi.STD_INPUT_HANDLE)
+    if h == winapi.INVALID_HANDLE_VALUE:
+        return _readline_windows_fallback()
+
+    buf_size = 1024
+    buf = ctypes.create_string_buffer(buf_size * ctypes.sizeof(winapi.WCHAR))
+    read = winapi.DWORD()
+
+    text = u""
+    while True:
+        if winapi.ReadConsoleW(
+                h, buf, buf_size, ctypes.byref(read), None) == 0:
+            if not text:
+                return _readline_windows_fallback()
+            raise ctypes.WinError()
+        data = buf[:read.value * ctypes.sizeof(winapi.WCHAR)]
+        text += data.decode("utf-16-le", _surrogatepass)
+        if text.endswith(u"\r\n"):
+            return text[:-2]
+
+
+def _decode_codepage(codepage, data):
+    """
+    Args:
+        codepage (int)
+        data (bytes)
+    Returns:
+        `text`
+
+    Decodes data using the given codepage. If some data can't be decoded
+    using the codepage it will not fail.
+    """
+
+    assert isinstance(data, bytes)
+
+    if not data:
+        return u""
+
+    # get the required buffer length first
+    length = winapi.MultiByteToWideChar(codepage, 0, data, len(data), None, 0)
+    if length == 0:
+        raise ctypes.WinError()
+
+    # now decode
+    buf = ctypes.create_unicode_buffer(length)
+    length = winapi.MultiByteToWideChar(
+        codepage, 0, data, len(data), buf, length)
+    if length == 0:
+        raise ctypes.WinError()
+
+    return buf[:]
+
+
+def _encode_codepage(codepage, text):
+    """
+    Args:
+        codepage (int)
+        text (text)
+    Returns:
+        `bytes`
+
+    Encode text using the given code page. Will not fail if a char
+    can't be encoded using that codepage.
+    """
+
+    assert isinstance(text, text_type)
+
+    if not text:
+        return b""
+
+    size = (len(text.encode("utf-16-le", _surrogatepass)) //
+            ctypes.sizeof(winapi.WCHAR))
+
+    # get the required buffer size
+    length = winapi.WideCharToMultiByte(
+        codepage, 0, text, size, None, 0, None, None)
+    if length == 0:
+        raise ctypes.WinError()
+
+    # decode to the buffer
+    buf = ctypes.create_string_buffer(length)
+    length = winapi.WideCharToMultiByte(
+        codepage, 0, text, size, buf, length, None, None)
+    if length == 0:
+        raise ctypes.WinError()
+    return buf[:length]
+
+
+def _readline_windows_fallback():
+    # In case reading from the console failed (maybe we get piped data)
+    # we assume the input was generated according to the output encoding.
+    # Got any better ideas?
+    assert is_win
+    cp = winapi.GetConsoleOutputCP()
+    data = getattr(sys.stdin, "buffer", sys.stdin).readline().rstrip(b"\r\n")
+    return _decode_codepage(cp, data)
+
+
+def _readline_default():
+    assert is_unix
+    data = getattr(sys.stdin, "buffer", sys.stdin).readline().rstrip(b"\r\n")
+    if PY3:
+        return data.decode(_encoding, "surrogateescape")
+    else:
+        return data
+
+
+def _readline():
+    if is_win:
+        return _readline_windows()
+    else:
+        return _readline_default()
+
+
+def input_(prompt=None):
+    """
+    Args:
+        prompt (object): Prints the passed object to stdout without
+            adding a trailing newline
+    Returns:
+        `fsnative`
+    Raises:
+        EnvironmentError
+
+    Like :func:`python3:input` but returns a `fsnative` and allows printing
+    filenames as prompt to stdout.
+
+    Use :func:`fsn2text` on the result if you just want to deal with text.
+    """
+
+    if prompt is not None:
+        print_(prompt, end="")
+
+    return _readline()
@@ -0,0 +1,146 @@
+# -*- coding: utf-8 -*-
+# Copyright 2016 Christoph Reiter
+#
+# Permission is hereby granted, free of charge, to any person obtaining
+# a copy of this software and associated documentation files (the
+# "Software"), to deal in the Software without restriction, including
+# without limitation the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the Software, and to
+# permit persons to whom the Software is furnished to do so, subject to
+# the following conditions:
+#
+# The above copyright notice and this permission notice shall be
+# included in all copies or substantial portions of the Software.
+
+import re
+import os
+
+from ._fsnative import path2fsn, fsnative, is_win
+from ._compat import PY2
+from ._environ import environ
+
+
+sep = path2fsn(os.sep)
+pathsep = path2fsn(os.pathsep)
+curdir = path2fsn(os.curdir)
+pardir = path2fsn(os.pardir)
+altsep = path2fsn(os.altsep) if os.altsep is not None else None
+extsep = path2fsn(os.extsep)
+devnull = path2fsn(os.devnull)
+defpath = path2fsn(os.defpath)
+
+
+def getcwd():
+    """Like `os.getcwd` but returns a `fsnative` path
+
+    Returns:
+        `fsnative`
+    """
+
+    if is_win and PY2:
+        return os.getcwdu()
+    return os.getcwd()
+
+
+def _get_userdir(user=None):
+    """Returns the user dir or None"""
+
+    if user is not None and not isinstance(user, fsnative):
+        raise TypeError
+
+    if is_win:
+        if "HOME" in environ:
+            path = environ["HOME"]
+        elif "USERPROFILE" in environ:
+            path = environ["USERPROFILE"]
+        elif "HOMEPATH" in environ and "HOMEDRIVE" in environ:
+            path = os.path.join(environ["HOMEDRIVE"], environ["HOMEPATH"])
+        else:
+            return
+
+        if user is None:
+            return path
+        else:
+            return os.path.join(os.path.dirname(path), user)
+    else:
+        import pwd
+
+        if user is None:
+            if "HOME" in environ:
+                return environ["HOME"]
+            else:
+                try:
+                    return path2fsn(pwd.getpwuid(os.getuid()).pw_dir)
+                except KeyError:
+                    return
+        else:
+            try:
+                return path2fsn(pwd.getpwnam(user).pw_dir)
+            except KeyError:
+                return
+
+
+def expanduser(path):
+    """
+    Args:
+        path (pathlike): A path to expand
+    Returns:
+        `fsnative`
+
+    Like :func:`python:os.path.expanduser` but supports unicode home
+    directories under Windows + Python 2 and always returns a `fsnative`.
+    """
+
+    path = path2fsn(path)
+
+    if path == "~":
+        return _get_userdir()
+    elif path.startswith("~" + sep) or (
+            altsep is not None and path.startswith("~" + altsep)):
+        userdir = _get_userdir()
+        if userdir is None:
+            return path
+        return userdir + path[1:]
+    elif path.startswith("~"):
+        sep_index = path.find(sep)
+        if altsep is not None:
+            alt_index = path.find(altsep)
+            if alt_index != -1 and alt_index < sep_index:
+                sep_index = alt_index
+
+        if sep_index == -1:
+            user = path[1:]
+            rest = ""
+        else:
+            user = path[1:sep_index]
+            rest = path[sep_index:]
+
+        userdir = _get_userdir(user)
+        if userdir is not None:
+            return userdir + rest
+        else:
+            return path
+    else:
+        return path
+
+
+def expandvars(path):
+    """
+    Args:
+        path (pathlike): A path to expand
+    Returns:
+        `fsnative`
+
+    Like :func:`python:os.path.expandvars` but supports unicode under Windows
+    + Python 2 and always returns a `fsnative`.
+    """
+
+    path = path2fsn(path)
+
+    def repl_func(match):
+        return environ.get(match.group(1), match.group(0))
+
+    path = re.compile(r"\$(\w+)", flags=re.UNICODE).sub(repl_func, path)
+    if os.name == "nt":
+        path = re.sub(r"%([^%]+)%", repl_func, path)
+    return re.sub(r"\$\{([^\}]+)\}", repl_func, path)
@@ -0,0 +1,88 @@
+# -*- coding: utf-8 -*-
+# Copyright 2016 Christoph Reiter
+#
+# Permission is hereby granted, free of charge, to any person obtaining
+# a copy of this software and associated documentation files (the
+# "Software"), to deal in the Software without restriction, including
+# without limitation the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the Software, and to
+# permit persons to whom the Software is furnished to do so, subject to
+# the following conditions:
+#
+# The above copyright notice and this permission notice shall be
+# included in all copies or substantial portions of the Software.
+
+import tempfile
+
+from ._fsnative import path2fsn, fsnative
+
+
+def gettempdir():
+    """
+    Returns:
+        `fsnative`
+
+    Like :func:`python3:tempfile.gettempdir`, but always returns a `fsnative`
+    path
+    """
+
+    # FIXME: I don't want to reimplement all that logic, reading env vars etc.
+    # At least for the default it works.
+    return path2fsn(tempfile.gettempdir())
+
+
+def gettempprefix():
+    """
+    Returns:
+        `fsnative`
+
+    Like :func:`python3:tempfile.gettempprefix`, but always returns a
+    `fsnative` path
+    """
+
+    return path2fsn(tempfile.gettempprefix())
+
+
+def mkstemp(suffix=None, prefix=None, dir=None, text=False):
+    """
+    Args:
+        suffix (`pathlike` or `None`): suffix or `None` to use the default
+        prefix (`pathlike` or `None`): prefix or `None` to use the default
+        dir (`pathlike` or `None`): temp dir or `None` to use the default
+        text (bool): if the file should be opened in text mode
+    Returns:
+        Tuple[`int`, `fsnative`]:
+            A tuple containing the file descriptor and the file path
+    Raises:
+        EnvironmentError
+
+    Like :func:`python3:tempfile.mkstemp` but always returns a `fsnative`
+    path.
+    """
+
+    suffix = fsnative() if suffix is None else path2fsn(suffix)
+    prefix = gettempprefix() if prefix is None else path2fsn(prefix)
+    dir = gettempdir() if dir is None else path2fsn(dir)
+
+    return tempfile.mkstemp(suffix, prefix, dir, text)
+
+
+def mkdtemp(suffix=None, prefix=None, dir=None):
+    """
+    Args:
+        suffix (`pathlike` or `None`): suffix or `None` to use the default
+        prefix (`pathlike` or `None`): prefix or `None` to use the default
+        dir (`pathlike` or `None`): temp dir or `None` to use the default
+    Returns:
+        `fsnative`: A path to a directory
+    Raises:
+        EnvironmentError
+
+    Like :func:`python3:tempfile.mkstemp` but always returns a `fsnative` path.
+    """
+
+    suffix = fsnative() if suffix is None else path2fsn(suffix)
+    prefix = gettempprefix() if prefix is None else path2fsn(prefix)
+    dir = gettempdir() if dir is None else path2fsn(dir)
+
+    return tempfile.mkdtemp(suffix, prefix, dir)
@@ -0,0 +1,311 @@
+# -*- coding: utf-8 -*-
+# Copyright 2016 Christoph Reiter
+#
+# Permission is hereby granted, free of charge, to any person obtaining
+# a copy of this software and associated documentation files (the
+# "Software"), to deal in the Software without restriction, including
+# without limitation the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the Software, and to
+# permit persons to whom the Software is furnished to do so, subject to
+# the following conditions:
+#
+# The above copyright notice and this permission notice shall be
+# included in all copies or substantial portions of the Software.
+
+import ctypes
+import re
+import atexit
+
+from . import _winapi as winapi
+
+
+def ansi_parse(code):
+    """Returns command, (args)"""
+
+    return code[-1:], tuple([int(v or "0") for v in code[2:-1].split(";")])
+
+
+def ansi_split(text, _re=re.compile(u"(\x1b\[(\d*;?)*\S)")):
+    """Yields (is_ansi, text)"""
+
+    for part in _re.split(text):
+        if part:
+            yield (bool(_re.match(part)), part)
+
+
+class AnsiCommand(object):
+    TEXT = "m"
+
+    MOVE_UP = "A"
+    MOVE_DOWN = "B"
+    MOVE_FORWARD = "C"
+    MOVE_BACKWARD = "D"
+
+    SET_POS = "H"
+    SET_POS_ALT = "f"
+
+    SAVE_POS = "s"
+    RESTORE_POS = "u"
+
+
+class TextAction(object):
+    RESET_ALL = 0
+
+    SET_BOLD = 1
+    SET_DIM = 2
+    SET_ITALIC = 3
+    SET_UNDERLINE = 4
+    SET_BLINK = 5
+    SET_BLINK_FAST = 6
+    SET_REVERSE = 7
+    SET_HIDDEN = 8
+
+    RESET_BOLD = 21
+    RESET_DIM = 22
+    RESET_ITALIC = 23
+    RESET_UNDERLINE = 24
+    RESET_BLINK = 25
+    RESET_BLINK_FAST = 26
+    RESET_REVERSE = 27
+    RESET_HIDDEN = 28
+
+    FG_BLACK = 30
+    FG_RED = 31
+    FG_GREEN = 32
+    FG_YELLOW = 33
+    FG_BLUE = 34
+    FG_MAGENTA = 35
+    FG_CYAN = 36
+    FG_WHITE = 37
+
+    FG_DEFAULT = 39
+
+    FG_LIGHT_BLACK = 90
+    FG_LIGHT_RED = 91
+    FG_LIGHT_GREEN = 92
+    FG_LIGHT_YELLOW = 93
+    FG_LIGHT_BLUE = 94
+    FG_LIGHT_MAGENTA = 95
+    FG_LIGHT_CYAN = 96
+    FG_LIGHT_WHITE = 97
+
+    BG_BLACK = 40
+    BG_RED = 41
+    BG_GREEN = 42
+    BG_YELLOW = 43
+    BG_BLUE = 44
+    BG_MAGENTA = 45
+    BG_CYAN = 46
+    BG_WHITE = 47
+
+    BG_DEFAULT = 49
+
+    BG_LIGHT_BLACK = 100
+    BG_LIGHT_RED = 101
+    BG_LIGHT_GREEN = 102
+    BG_LIGHT_YELLOW = 103
+    BG_LIGHT_BLUE = 104
+    BG_LIGHT_MAGENTA = 105
+    BG_LIGHT_CYAN = 106
+    BG_LIGHT_WHITE = 107
+
+
+class AnsiState(object):
+
+    def __init__(self):
+        self.default_attrs = None
+
+        self.bold = False
+        self.bg_light = False
+        self.fg_light = False
+
+        self.saved_pos = (0, 0)
+
+    def do_text_action(self, attrs, action):
+        # In case the external state has changed, apply it it to ours.
+        # Mostly the first time this is called.
+        if attrs & winapi.FOREGROUND_INTENSITY and not self.fg_light \
+                and not self.bold:
+            self.fg_light = True
+        if attrs & winapi.BACKGROUND_INTENSITY and not self.bg_light:
+            self.bg_light = True
+
+        dark_fg = {
+            TextAction.FG_BLACK: 0,
+            TextAction.FG_RED: winapi.FOREGROUND_RED,
+            TextAction.FG_GREEN: winapi.FOREGROUND_GREEN,
+            TextAction.FG_YELLOW:
+                winapi.FOREGROUND_GREEN | winapi.FOREGROUND_RED,
+            TextAction.FG_BLUE: winapi.FOREGROUND_BLUE,
+            TextAction.FG_MAGENTA: winapi.FOREGROUND_BLUE |
+                winapi.FOREGROUND_RED,
+            TextAction.FG_CYAN:
+                winapi.FOREGROUND_BLUE | winapi.FOREGROUND_GREEN,
+            TextAction.FG_WHITE:
+                winapi.FOREGROUND_BLUE | winapi.FOREGROUND_GREEN |
+                winapi.FOREGROUND_RED,
+        }
+
+        dark_bg = {
+            TextAction.BG_BLACK: 0,
+            TextAction.BG_RED: winapi.BACKGROUND_RED,
+            TextAction.BG_GREEN: winapi.BACKGROUND_GREEN,
+            TextAction.BG_YELLOW:
+                winapi.BACKGROUND_GREEN | winapi.BACKGROUND_RED,
+            TextAction.BG_BLUE: winapi.BACKGROUND_BLUE,
+            TextAction.BG_MAGENTA:
+                winapi.BACKGROUND_BLUE | winapi.BACKGROUND_RED,
+            TextAction.BG_CYAN:
+                winapi.BACKGROUND_BLUE | winapi.BACKGROUND_GREEN,
+            TextAction.BG_WHITE:
+                winapi.BACKGROUND_BLUE | winapi.BACKGROUND_GREEN |
+                winapi.BACKGROUND_RED,
+        }
+
+        light_fg = {
+            TextAction.FG_LIGHT_BLACK: 0,
+            TextAction.FG_LIGHT_RED: winapi.FOREGROUND_RED,
+            TextAction.FG_LIGHT_GREEN: winapi.FOREGROUND_GREEN,
+            TextAction.FG_LIGHT_YELLOW:
+                winapi.FOREGROUND_GREEN | winapi.FOREGROUND_RED,
+            TextAction.FG_LIGHT_BLUE: winapi.FOREGROUND_BLUE,
+            TextAction.FG_LIGHT_MAGENTA:
+                winapi.FOREGROUND_BLUE | winapi.FOREGROUND_RED,
+            TextAction.FG_LIGHT_CYAN:
+                winapi.FOREGROUND_BLUE | winapi.FOREGROUND_GREEN,
+            TextAction.FG_LIGHT_WHITE:
+                winapi.FOREGROUND_BLUE | winapi.FOREGROUND_GREEN |
+                winapi.FOREGROUND_RED,
+        }
+
+        light_bg = {
+            TextAction.BG_LIGHT_BLACK: 0,
+            TextAction.BG_LIGHT_RED: winapi.BACKGROUND_RED,
+            TextAction.BG_LIGHT_GREEN: winapi.BACKGROUND_GREEN,
+            TextAction.BG_LIGHT_YELLOW:
+                winapi.BACKGROUND_GREEN | winapi.BACKGROUND_RED,
+            TextAction.BG_LIGHT_BLUE: winapi.BACKGROUND_BLUE,
+            TextAction.BG_LIGHT_MAGENTA:
+                winapi.BACKGROUND_BLUE | winapi.BACKGROUND_RED,
+            TextAction.BG_LIGHT_CYAN:
+                winapi.BACKGROUND_BLUE | winapi.BACKGROUND_GREEN,
+            TextAction.BG_LIGHT_WHITE:
+                winapi.BACKGROUND_BLUE | winapi.BACKGROUND_GREEN |
+                winapi.BACKGROUND_RED,
+        }
+
+        if action == TextAction.RESET_ALL:
+            attrs = self.default_attrs
+            self.bold = self.fg_light = self.bg_light = False
+        elif action == TextAction.SET_BOLD:
+            self.bold = True
+        elif action == TextAction.RESET_BOLD:
+            self.bold = False
+        elif action == TextAction.SET_DIM:
+            self.bold = False
+        elif action == TextAction.SET_REVERSE:
+            attrs |= winapi.COMMON_LVB_REVERSE_VIDEO
+        elif action == TextAction.RESET_REVERSE:
+            attrs &= ~winapi.COMMON_LVB_REVERSE_VIDEO
+        elif action == TextAction.SET_UNDERLINE:
+            attrs |= winapi.COMMON_LVB_UNDERSCORE
+        elif action == TextAction.RESET_UNDERLINE:
+            attrs &= ~winapi.COMMON_LVB_UNDERSCORE
+        elif action == TextAction.FG_DEFAULT:
+            attrs = (attrs & ~0xF) | (self.default_attrs & 0xF)
+            self.fg_light = False
+        elif action == TextAction.BG_DEFAULT:
+            attrs = (attrs & ~0xF0) | (self.default_attrs & 0xF0)
+            self.bg_light = False
+        elif action in dark_fg:
+            attrs = (attrs & ~0xF) | dark_fg[action]
+            self.fg_light = False
+        elif action in dark_bg:
+            attrs = (attrs & ~0xF0) | dark_bg[action]
+            self.bg_light = False
+        elif action in light_fg:
+            attrs = (attrs & ~0xF) | light_fg[action]
+            self.fg_light = True
+        elif action in light_bg:
+            attrs = (attrs & ~0xF0) | light_bg[action]
+            self.bg_light = True
+
+        if self.fg_light or self.bold:
+            attrs |= winapi.FOREGROUND_INTENSITY
+        else:
+            attrs &= ~winapi.FOREGROUND_INTENSITY
+
+        if self.bg_light:
+            attrs |= winapi.BACKGROUND_INTENSITY
+        else:
+            attrs &= ~winapi.BACKGROUND_INTENSITY
+
+        return attrs
+
+    def apply(self, handle, code):
+        buffer_info = winapi.CONSOLE_SCREEN_BUFFER_INFO()
+        if not winapi.GetConsoleScreenBufferInfo(handle,
+                                                 ctypes.byref(buffer_info)):
+            return
+
+        attrs = buffer_info.wAttributes
+
+        # We take the first attrs we see as default
+        if self.default_attrs is None:
+            self.default_attrs = attrs
+            # Make sure that like with linux terminals the program doesn't
+            # affect the prompt after it exits
+            atexit.register(
+                winapi.SetConsoleTextAttribute, handle, self.default_attrs)
+
+        cmd, args = ansi_parse(code)
+        if cmd == AnsiCommand.TEXT:
+            for action in args:
+                attrs = self.do_text_action(attrs, action)
+            winapi.SetConsoleTextAttribute(handle, attrs)
+        elif cmd in (AnsiCommand.MOVE_UP, AnsiCommand.MOVE_DOWN,
+                     AnsiCommand.MOVE_FORWARD, AnsiCommand.MOVE_BACKWARD):
+
+            coord = buffer_info.dwCursorPosition
+            x, y = coord.X, coord.Y
+
+            amount = max(args[0], 1)
+
+            if cmd == AnsiCommand.MOVE_UP:
+                y -= amount
+            elif cmd == AnsiCommand.MOVE_DOWN:
+                y += amount
+            elif cmd == AnsiCommand.MOVE_FORWARD:
+                x += amount
+            elif cmd == AnsiCommand.MOVE_BACKWARD:
+                x -= amount
+
+            x = max(x, 0)
+            y = max(y, 0)
+            winapi.SetConsoleCursorPosition(handle, winapi.COORD(x, y))
+        elif cmd in (AnsiCommand.SET_POS, AnsiCommand.SET_POS_ALT):
+            args = list(args)
+            while len(args) < 2:
+                args.append(0)
+            x, y = args[:2]
+
+            win_rect = buffer_info.srWindow
+            x += win_rect.Left - 1
+            y += win_rect.Top - 1
+
+            x = max(x, 0)
+            y = max(y, 0)
+            winapi.SetConsoleCursorPosition(handle, winapi.COORD(x, y))
+        elif cmd == AnsiCommand.SAVE_POS:
+            win_rect = buffer_info.srWindow
+            coord = buffer_info.dwCursorPosition
+            x, y = coord.X, coord.Y
+            x -= win_rect.Left
+            y -= win_rect.Top
+            self.saved_pos = (x, y)
+        elif cmd == AnsiCommand.RESTORE_POS:
+            win_rect = buffer_info.srWindow
+            x, y = self.saved_pos
+            x += win_rect.Left
+            y += win_rect.Top
+            winapi.SetConsoleCursorPosition(handle, winapi.COORD(x, y))
@@ -0,0 +1,183 @@
+# -*- coding: utf-8 -*-
+# Copyright 2016 Christoph Reiter
+#
+# Permission is hereby granted, free of charge, to any person obtaining
+# a copy of this software and associated documentation files (the
+# "Software"), to deal in the Software without restriction, including
+# without limitation the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the Software, and to
+# permit persons to whom the Software is furnished to do so, subject to
+# the following conditions:
+#
+# The above copyright notice and this permission notice shall be
+# included in all copies or substantial portions of the Software.
+
+import ctypes
+from ctypes import WinDLL, wintypes
+
+
+shell32 = WinDLL("shell32")
+kernel32 = WinDLL("kernel32")
+shlwapi = WinDLL("shlwapi")
+
+GetCommandLineW = kernel32.GetCommandLineW
+GetCommandLineW.argtypes = []
+GetCommandLineW.restype = wintypes.LPCWSTR
+
+CommandLineToArgvW = shell32.CommandLineToArgvW
+CommandLineToArgvW.argtypes = [
+    wintypes.LPCWSTR, ctypes.POINTER(ctypes.c_int)]
+CommandLineToArgvW.restype = ctypes.POINTER(wintypes.LPWSTR)
+
+LocalFree = kernel32.LocalFree
+LocalFree.argtypes = [wintypes.HLOCAL]
+LocalFree.restype = wintypes.HLOCAL
+
+# https://msdn.microsoft.com/en-us/library/windows/desktop/aa383751.aspx
+LPCTSTR = ctypes.c_wchar_p
+LPWSTR = wintypes.LPWSTR
+LPCWSTR = ctypes.c_wchar_p
+LPTSTR = LPWSTR
+PCWSTR = ctypes.c_wchar_p
+PCTSTR = PCWSTR
+PWSTR = ctypes.c_wchar_p
+PTSTR = PWSTR
+LPVOID = wintypes.LPVOID
+WCHAR = wintypes.WCHAR
+LPSTR = ctypes.c_char_p
+
+BOOL = wintypes.BOOL
+LPBOOL = ctypes.POINTER(BOOL)
+UINT = wintypes.UINT
+WORD = wintypes.WORD
+DWORD = wintypes.DWORD
+SHORT = wintypes.SHORT
+HANDLE = wintypes.HANDLE
+ULONG = wintypes.ULONG
+LPCSTR = wintypes.LPCSTR
+
+STD_INPUT_HANDLE = DWORD(-10)
+STD_OUTPUT_HANDLE = DWORD(-11)
+STD_ERROR_HANDLE = DWORD(-12)
+
+INVALID_HANDLE_VALUE = wintypes.HANDLE(-1).value
+
+INTERNET_MAX_SCHEME_LENGTH = 32
+INTERNET_MAX_PATH_LENGTH = 2048
+INTERNET_MAX_URL_LENGTH = (
+    INTERNET_MAX_SCHEME_LENGTH + len("://") + INTERNET_MAX_PATH_LENGTH)
+
+FOREGROUND_BLUE = 0x0001
+FOREGROUND_GREEN = 0x0002
+FOREGROUND_RED = 0x0004
+FOREGROUND_INTENSITY = 0x0008
+
+BACKGROUND_BLUE = 0x0010
+BACKGROUND_GREEN = 0x0020
+BACKGROUND_RED = 0x0040
+BACKGROUND_INTENSITY = 0x0080
+
+COMMON_LVB_REVERSE_VIDEO = 0x4000
+COMMON_LVB_UNDERSCORE = 0x8000
+
+UrlCreateFromPathW = shlwapi.UrlCreateFromPathW
+UrlCreateFromPathW.argtypes = [
+    PCTSTR, PTSTR, ctypes.POINTER(DWORD), DWORD]
+UrlCreateFromPathW.restype = ctypes.HRESULT
+
+SetEnvironmentVariableW = kernel32.SetEnvironmentVariableW
+SetEnvironmentVariableW.argtypes = [LPCTSTR, LPCTSTR]
+SetEnvironmentVariableW.restype = wintypes.BOOL
+
+GetEnvironmentVariableW = kernel32.GetEnvironmentVariableW
+GetEnvironmentVariableW.argtypes = [LPCTSTR, LPTSTR, DWORD]
+GetEnvironmentVariableW.restype = DWORD
+
+GetEnvironmentStringsW = kernel32.GetEnvironmentStringsW
+GetEnvironmentStringsW.argtypes = []
+GetEnvironmentStringsW.restype = ctypes.c_void_p
+
+FreeEnvironmentStringsW = kernel32.FreeEnvironmentStringsW
+FreeEnvironmentStringsW.argtypes = [ctypes.c_void_p]
+FreeEnvironmentStringsW.restype = ctypes.c_bool
+
+GetStdHandle = kernel32.GetStdHandle
+GetStdHandle.argtypes = [DWORD]
+GetStdHandle.restype = HANDLE
+
+
+class COORD(ctypes.Structure):
+
+    _fields_ = [
+        ("X", SHORT),
+        ("Y", SHORT),
+    ]
+
+
+class SMALL_RECT(ctypes.Structure):
+
+    _fields_ = [
+        ("Left", SHORT),
+        ("Top", SHORT),
+        ("Right", SHORT),
+        ("Bottom", SHORT),
+    ]
+
+
+class CONSOLE_SCREEN_BUFFER_INFO(ctypes.Structure):
+
+    _fields_ = [
+        ("dwSize", COORD),
+        ("dwCursorPosition", COORD),
+        ("wAttributes", WORD),
+        ("srWindow", SMALL_RECT),
+        ("dwMaximumWindowSize", COORD),
+    ]
+
+
+GetConsoleScreenBufferInfo = kernel32.GetConsoleScreenBufferInfo
+GetConsoleScreenBufferInfo.argtypes = [
+    HANDLE, ctypes.POINTER(CONSOLE_SCREEN_BUFFER_INFO)]
+GetConsoleScreenBufferInfo.restype = BOOL
+
+GetConsoleOutputCP = kernel32.GetConsoleOutputCP
+GetConsoleOutputCP.argtypes = []
+GetConsoleOutputCP.restype = UINT
+
+SetConsoleOutputCP = kernel32.SetConsoleOutputCP
+SetConsoleOutputCP.argtypes = [UINT]
+SetConsoleOutputCP.restype = BOOL
+
+GetConsoleCP = kernel32.GetConsoleCP
+GetConsoleCP.argtypes = []
+GetConsoleCP.restype = UINT
+
+SetConsoleCP = kernel32.SetConsoleCP
+SetConsoleCP.argtypes = [UINT]
+SetConsoleCP.restype = BOOL
+
+SetConsoleTextAttribute = kernel32.SetConsoleTextAttribute
+SetConsoleTextAttribute.argtypes = [HANDLE, WORD]
+SetConsoleTextAttribute.restype = BOOL
+
+SetConsoleCursorPosition = kernel32.SetConsoleCursorPosition
+SetConsoleCursorPosition.argtypes = [HANDLE, COORD]
+SetConsoleCursorPosition.restype = BOOL
+
+ReadConsoleW = kernel32.ReadConsoleW
+ReadConsoleW.argtypes = [HANDLE, LPVOID, DWORD, ctypes.POINTER(DWORD), LPVOID]
+ReadConsoleW.restype = BOOL
+
+MultiByteToWideChar = kernel32.MultiByteToWideChar
+MultiByteToWideChar.argtypes = [
+    UINT, DWORD, LPCSTR, ctypes.c_int, LPWSTR, ctypes.c_int]
+MultiByteToWideChar.restype = ctypes.c_int
+
+WideCharToMultiByte = kernel32.WideCharToMultiByte
+WideCharToMultiByte.argtypes = [
+    UINT, DWORD, LPCWSTR, ctypes.c_int, LPSTR, ctypes.c_int, LPCSTR, LPBOOL]
+WideCharToMultiByte.restpye = ctypes.c_int
+
+MoveFileW = kernel32.MoveFileW
+MoveFileW.argtypes = [LPCTSTR, LPCTSTR]
+MoveFileW.restype = BOOL
@@ -1,14 +1,107 @@
+# -*- coding: utf-8 -*-
 # Copyright (C) 2005  Michael Urman
 #
 # This program is free software; you can redistribute it and/or modify
-# it under the terms of version 2 of the GNU General Public License as
-# published by the Free Software Foundation.
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+
+from ._util import loadfile


-class Metadata(object):
-    """An abstract dict-like object.
+class PaddingInfo(object):
+    """PaddingInfo()

-    Metadata is the base class for many of the tag objects in Mutagen.
+    Abstract padding information object.
+
+    This will be passed to the callback function that can be used
+    for saving tags.
+
+    ::
+
+        def my_callback(info: PaddingInfo):
+            return info.get_default_padding()
+
+    The callback should return the amount of padding to use (>= 0) based on
+    the content size and the padding of the file after saving. The actual used
+    amount of padding might vary depending on the file format (due to
+    alignment etc.)
+
+    The default implementation can be accessed using the
+    :meth:`get_default_padding` method in the callback.
+
+    Attributes:
+        padding (`int`): The amount of padding left after saving in bytes
+            (can be negative if more data needs to be added as padding is
+            available)
+        size (`int`): The amount of data following the padding
+    """
+
+    def __init__(self, padding, size):
+        self.padding = padding
+        self.size = size
+
+    def get_default_padding(self):
+        """The default implementation which tries to select a reasonable
+        amount of padding and which might change in future versions.
+
+        Returns:
+            int: Amount of padding after saving
+        """
+
+        high = 1024 * 10 + self.size // 100  # 10 KiB + 1% of trailing data
+        low = 1024 + self.size // 1000  # 1 KiB + 0.1% of trailing data
+
+        if self.padding >= 0:
+            # enough padding left
+            if self.padding > high:
+                # padding too large, reduce
+                return low
+            # just use existing padding as is
+            return self.padding
+        else:
+            # not enough padding, add some
+            return low
+
+    def _get_padding(self, user_func):
+        if user_func is None:
+            return self.get_default_padding()
+        else:
+            return user_func(self)
+
+    def __repr__(self):
+        return "<%s size=%d padding=%d>" % (
+            type(self).__name__, self.size, self.padding)
+
+
+class Tags(object):
+    """`Tags` is the base class for many of the tag objects in Mutagen.
+
+    In many cases it has a dict like interface.
+    """
+
+    __module__ = "mutagen"
+
+    def pprint(self):
+        """
+        Returns:
+            text: tag information
+        """
+
+        raise NotImplementedError
+
+
+class Metadata(Tags):
+    """Metadata(filething=None, **kwargs)
+
+    Args:
+        filething (filething): a filename or a file-like object or `None`
+            to create an empty instance (like ``ID3()``)
+
+    Like :class:`Tags` but for standalone tagging formats that are not
+    solely managed by a container format.
+
+    Provides methods to load, save and delete tags.
    """

    __module__ = "mutagen"
@@ -17,15 +110,37 @@ class Metadata(object):
        if args or kwargs:
            self.load(*args, **kwargs)

-    def load(self, *args, **kwargs):
+    @loadfile()
+    def load(self, filething, **kwargs):
        raise NotImplementedError

-    def save(self, filename=None):
-        """Save changes to a file."""
+    @loadfile(writable=False)
+    def save(self, filething, **kwargs):
+        """save(filething=None, **kwargs)
+
+        Save changes to a file.
+
+        Args:
+            filething (filething): or `None`
+        Raises:
+            MutagenError: if saving wasn't possible
+        """

        raise NotImplementedError

-    def delete(self, filename=None):
-        """Remove tags from a file."""
+    @loadfile(writable=False)
+    def delete(self, filething):
+        """delete(filething=None)
+
+        Remove tags from a file.
+
+        In most cases this means any traces of the tag will be removed
+        from the file.
+
+        Args:
+            filething (filething): or `None`
+        Raises:
+            MutagenError: if deleting wasn't possible
+        """

        raise NotImplementedError
@@ -0,0 +1,7 @@
+# -*- coding: utf-8 -*-
+# Copyright 2016 Christoph Reiter
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
@@ -0,0 +1,95 @@
+# -*- coding: utf-8 -*-
+# Copyright 2015 Christoph Reiter
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+
+import os
+import signal
+import contextlib
+import optparse
+
+from mutagen._senf import print_
+from mutagen._compat import text_type, iterbytes
+
+
+def split_escape(string, sep, maxsplit=None, escape_char="\\"):
+    """Like unicode/str/bytes.split but allows for the separator to be escaped
+
+    If passed unicode/str/bytes will only return list of unicode/str/bytes.
+    """
+
+    assert len(sep) == 1
+    assert len(escape_char) == 1
+
+    if isinstance(string, bytes):
+        if isinstance(escape_char, text_type):
+            escape_char = escape_char.encode("ascii")
+        iter_ = iterbytes
+    else:
+        iter_ = iter
+
+    if maxsplit is None:
+        maxsplit = len(string)
+
+    empty = string[:0]
+    result = []
+    current = empty
+    escaped = False
+    for char in iter_(string):
+        if escaped:
+            if char != escape_char and char != sep:
+                current += escape_char
+            current += char
+            escaped = False
+        else:
+            if char == escape_char:
+                escaped = True
+            elif char == sep and len(result) < maxsplit:
+                result.append(current)
+                current = empty
+            else:
+                current += char
+    result.append(current)
+    return result
+
+
+class SignalHandler(object):
+
+    def __init__(self):
+        self._interrupted = False
+        self._nosig = False
+        self._init = False
+
+    def init(self):
+        signal.signal(signal.SIGINT, self._handler)
+        signal.signal(signal.SIGTERM, self._handler)
+        if os.name != "nt":
+            signal.signal(signal.SIGHUP, self._handler)
+
+    def _handler(self, signum, frame):
+        self._interrupted = True
+        if not self._nosig:
+            raise SystemExit("Aborted...")
+
+    @contextlib.contextmanager
+    def block(self):
+        """While this context manager is active any signals for aborting
+        the process will be queued and exit the program once the context
+        is left.
+        """
+
+        self._nosig = True
+        yield
+        self._nosig = False
+        if self._interrupted:
+            raise SystemExit("Aborted...")
+
+
+class OptionParser(optparse.OptionParser):
+    """OptionParser subclass which supports printing Unicode under Windows"""
+
+    def print_help(self, file=None):
+        print_(self.format_help(), file=file)
@@ -0,0 +1,142 @@
+# -*- coding: utf-8 -*-
+# Copyright 2014 Marcus Sundman
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+
+"""A program replicating the functionality of id3lib's id3cp, using mutagen for
+tag loading and saving.
+"""
+
+import sys
+import os.path
+
+import mutagen
+import mutagen.id3
+from mutagen._senf import print_, argv
+from mutagen._compat import text_type
+
+from ._util import SignalHandler, OptionParser
+
+
+VERSION = (0, 1)
+_sig = SignalHandler()
+
+
+def printerr(*args, **kwargs):
+    kwargs.setdefault("file", sys.stderr)
+    print_(*args, **kwargs)
+
+
+class ID3OptionParser(OptionParser):
+    def __init__(self):
+        mutagen_version = mutagen.version_string
+        my_version = ".".join(map(str, VERSION))
+        version = "mid3cp %s\nUses Mutagen %s" % (my_version, mutagen_version)
+        self.disable_interspersed_args()
+        OptionParser.__init__(
+            self, version=version,
+            usage="%prog [option(s)] <src> <dst>",
+            description=("Copies ID3 tags from <src> to <dst>. Mutagen-based "
+                         "replacement for id3lib's id3cp."))
+
+
+def copy(src, dst, merge, write_v1=True, excluded_tags=None, verbose=False):
+    """Returns 0 on success"""
+
+    if excluded_tags is None:
+        excluded_tags = []
+
+    try:
+        id3 = mutagen.id3.ID3(src, translate=False)
+    except mutagen.id3.ID3NoHeaderError:
+        print_(u"No ID3 header found in ", src, file=sys.stderr)
+        return 1
+    except Exception as err:
+        print_(str(err), file=sys.stderr)
+        return 1
+
+    if verbose:
+        print_(u"File", src, u"contains:", file=sys.stderr)
+        print_(id3.pprint(), file=sys.stderr)
+
+    for tag in excluded_tags:
+        id3.delall(tag)
+
+    if merge:
+        try:
+            target = mutagen.id3.ID3(dst, translate=False)
+        except mutagen.id3.ID3NoHeaderError:
+            # no need to merge
+            pass
+        except Exception as err:
+            print_(str(err), file=sys.stderr)
+            return 1
+        else:
+            for frame in id3.values():
+                target.add(frame)
+
+            id3 = target
+
+    # if the source is 2.3 save it as 2.3
+    if id3.version < (2, 4, 0):
+        id3.update_to_v23()
+        v2_version = 3
+    else:
+        id3.update_to_v24()
+        v2_version = 4
+
+    try:
+        id3.save(dst, v1=(2 if write_v1 else 0), v2_version=v2_version)
+    except Exception as err:
+        print_(u"Error saving", dst, u":\n%s" % text_type(err),
+               file=sys.stderr)
+        return 1
+    else:
+        if verbose:
+            print_(u"Successfully saved", dst, file=sys.stderr)
+        return 0
+
+
+def main(argv):
+    parser = ID3OptionParser()
+    parser.add_option("-v", "--verbose", action="store_true", dest="verbose",
+                      help="print out saved tags", default=False)
+    parser.add_option("--write-v1", action="store_true", dest="write_v1",
+                      default=False, help="write id3v1 tags")
+    parser.add_option("-x", "--exclude-tag", metavar="TAG", action="append",
+                      dest="x", help="exclude the specified tag", default=[])
+    parser.add_option("--merge", action="store_true",
+                      help="Copy over frames instead of the whole ID3 tag",
+                      default=False)
+    (options, args) = parser.parse_args(argv[1:])
+
+    if len(args) != 2:
+        parser.print_help(file=sys.stderr)
+        return 1
+
+    (src, dst) = args
+
+    if not os.path.isfile(src):
+        print_(u"File not found:", src, file=sys.stderr)
+        parser.print_help(file=sys.stderr)
+        return 1
+
+    if not os.path.isfile(dst):
+        printerr(u"File not found:", dst, file=sys.stderr)
+        parser.print_help(file=sys.stderr)
+        return 1
+
+    # Strip tags - "-x FOO" adds whitespace at the beginning of the tag name
+    excluded_tags = [x.strip() for x in options.x]
+
+    with _sig.block():
+        return copy(src, dst, options.merge, options.write_v1, excluded_tags,
+                    options.verbose)
+
+
+def entry_point():
+    _sig.init()
+    return main(argv)
@@ -0,0 +1,171 @@
+# -*- coding: utf-8 -*-
+# Copyright 2006 Emfox Zhou <EmfoxZhou@gmail.com>
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+
+"""
+ID3iconv is a Java based ID3 encoding convertor, here's the Python version.
+"""
+
+import sys
+import locale
+
+import mutagen
+import mutagen.id3
+from mutagen._senf import argv, print_, fsnative
+from mutagen._compat import text_type
+
+from ._util import SignalHandler, OptionParser
+
+
+VERSION = (0, 3)
+_sig = SignalHandler()
+
+
+def getpreferredencoding():
+    return locale.getpreferredencoding() or "utf-8"
+
+
+def isascii(string):
+    """Checks whether a unicode string is non-empty and contains only ASCII
+    characters.
+    """
+    if not string:
+        return False
+
+    try:
+        string.encode('ascii')
+    except UnicodeEncodeError:
+        return False
+
+    return True
+
+
+class ID3OptionParser(OptionParser):
+    def __init__(self):
+        mutagen_version = ".".join(map(str, mutagen.version))
+        my_version = ".".join(map(str, VERSION))
+        version = "mid3iconv %s\nUses Mutagen %s" % (
+            my_version, mutagen_version)
+        return OptionParser.__init__(
+            self, version=version,
+            usage="%prog [OPTION] [FILE]...",
+            description=("Mutagen-based replacement the id3iconv utility, "
+                         "which converts ID3 tags from legacy encodings "
+                         "to Unicode and stores them using the ID3v2 format."))
+
+    def format_help(self, *args, **kwargs):
+        text = OptionParser.format_help(self, *args, **kwargs)
+        return text + "\nFiles are updated in-place, so use --dry-run first.\n"
+
+
+def update(options, filenames):
+    encoding = options.encoding or getpreferredencoding()
+    verbose = options.verbose
+    noupdate = options.noupdate
+    force_v1 = options.force_v1
+    remove_v1 = options.remove_v1
+
+    def conv(uni):
+        return uni.encode('iso-8859-1').decode(encoding)
+
+    for filename in filenames:
+        with _sig.block():
+            if verbose != "quiet":
+                print_(u"Updating", filename)
+
+            if has_id3v1(filename) and not noupdate and force_v1:
+                mutagen.id3.delete(filename, False, True)
+
+            try:
+                id3 = mutagen.id3.ID3(filename)
+            except mutagen.id3.ID3NoHeaderError:
+                if verbose != "quiet":
+                    print_(u"No ID3 header found; skipping...")
+                continue
+            except Exception as err:
+                print_(text_type(err), file=sys.stderr)
+                continue
+
+            for tag in filter(lambda t: t.startswith(("T", "COMM")), id3):
+                frame = id3[tag]
+                if isinstance(frame, mutagen.id3.TimeStampTextFrame):
+                    # non-unicode fields
+                    continue
+                try:
+                    text = frame.text
+                except AttributeError:
+                    continue
+                try:
+                    text = [conv(x) for x in frame.text]
+                except (UnicodeError, LookupError):
+                    continue
+                else:
+                    frame.text = text
+                    if not text or min(map(isascii, text)):
+                        frame.encoding = 3
+                    else:
+                        frame.encoding = 1
+
+            if verbose == "debug":
+                print_(id3.pprint())
+
+            if not noupdate:
+                if remove_v1:
+                    id3.save(filename, v1=False)
+                else:
+                    id3.save(filename)
+
+
+def has_id3v1(filename):
+    try:
+        with open(filename, 'rb+') as f:
+            f.seek(-128, 2)
+            return f.read(3) == b"TAG"
+    except IOError:
+        return False
+
+
+def main(argv):
+    parser = ID3OptionParser()
+    parser.add_option(
+        "-e", "--encoding", metavar="ENCODING", action="store",
+        type="string", dest="encoding",
+        help=("Specify original tag encoding (default is %s)" % (
+              getpreferredencoding())))
+    parser.add_option(
+        "-p", "--dry-run", action="store_true", dest="noupdate",
+        help="Do not actually modify files")
+    parser.add_option(
+        "--force-v1", action="store_true", dest="force_v1",
+        help="Use an ID3v1 tag even if an ID3v2 tag is present")
+    parser.add_option(
+        "--remove-v1", action="store_true", dest="remove_v1",
+        help="Remove v1 tag after processing the files")
+    parser.add_option(
+        "-q", "--quiet", action="store_const", dest="verbose",
+        const="quiet", help="Only output errors")
+    parser.add_option(
+        "-d", "--debug", action="store_const", dest="verbose",
+        const="debug", help="Output updated tags")
+
+    for i, arg in enumerate(argv):
+        if arg == "-v1":
+            argv[i] = fsnative(u"--force-v1")
+        elif arg == "-removev1":
+            argv[i] = fsnative(u"--remove-v1")
+
+    (options, args) = parser.parse_args(argv[1:])
+
+    if args:
+        update(options, args)
+    else:
+        parser.print_help()
+
+
+def entry_point():
+    _sig.init()
+    return main(argv)
@@ -0,0 +1,465 @@
+# -*- coding: utf-8 -*-
+# Copyright 2005 Joe Wreschnig
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+
+"""Pretend to be /usr/bin/id3v2 from id3lib, sort of."""
+
+import sys
+import codecs
+import mimetypes
+
+from optparse import SUPPRESS_HELP
+
+import mutagen
+import mutagen.id3
+from mutagen.id3 import Encoding, PictureType
+from mutagen._senf import fsnative, print_, argv, fsn2text, fsn2bytes, \
+    bytes2fsn
+from mutagen._compat import PY2, text_type
+
+from ._util import split_escape, SignalHandler, OptionParser
+
+
+VERSION = (1, 3)
+_sig = SignalHandler()
+
+global verbose
+verbose = True
+
+
+class ID3OptionParser(OptionParser):
+    def __init__(self):
+        mutagen_version = ".".join(map(str, mutagen.version))
+        my_version = ".".join(map(str, VERSION))
+        version = "mid3v2 %s\nUses Mutagen %s" % (my_version, mutagen_version)
+        self.edits = []
+        OptionParser.__init__(
+            self, version=version,
+            usage="%prog [OPTION] [FILE]...",
+            description="Mutagen-based replacement for id3lib's id3v2.")
+
+    def format_help(self, *args, **kwargs):
+        text = OptionParser.format_help(self, *args, **kwargs)
+        return text + """\
+You can set the value for any ID3v2 frame by using '--' and then a frame ID.
+For example:
+        mid3v2 --TIT3 "Monkey!" file.mp3
+would set the "Subtitle/Description" frame to "Monkey!".
+
+Any editing operation will cause the ID3 tag to be upgraded to ID3v2.4.
+"""
+
+
+def list_frames(option, opt, value, parser):
+    items = mutagen.id3.Frames.items()
+    for name, frame in sorted(items):
+        print_(u"    --%s    %s" % (name, frame.__doc__.split("\n")[0]))
+    raise SystemExit
+
+
+def list_frames_2_2(option, opt, value, parser):
+    items = mutagen.id3.Frames_2_2.items()
+    items.sort()
+    for name, frame in items:
+        print_(u"    --%s    %s" % (name, frame.__doc__.split("\n")[0]))
+    raise SystemExit
+
+
+def list_genres(option, opt, value, parser):
+    for i, genre in enumerate(mutagen.id3.TCON.GENRES):
+        print_(u"%3d: %s" % (i, genre))
+    raise SystemExit
+
+
+def delete_tags(filenames, v1, v2):
+    for filename in filenames:
+        with _sig.block():
+            if verbose:
+                print_(u"deleting ID3 tag info in", filename, file=sys.stderr)
+            mutagen.id3.delete(filename, v1, v2)
+
+
+def delete_frames(deletes, filenames):
+
+    try:
+        deletes = frame_from_fsnative(deletes)
+    except ValueError as err:
+        print_(text_type(err), file=sys.stderr)
+
+    frames = deletes.split(",")
+
+    for filename in filenames:
+        with _sig.block():
+            if verbose:
+                print_(u"deleting %s from" % deletes, filename,
+                       file=sys.stderr)
+            try:
+                id3 = mutagen.id3.ID3(filename)
+            except mutagen.id3.ID3NoHeaderError:
+                if verbose:
+                    print_(u"No ID3 header found; skipping.", file=sys.stderr)
+            except Exception as err:
+                print_(text_type(err), file=sys.stderr)
+                raise SystemExit(1)
+            else:
+                for frame in frames:
+                    id3.delall(frame)
+                id3.save()
+
+
+def frame_from_fsnative(arg):
+    """Takes item from argv and returns ascii native str
+    or raises ValueError.
+    """
+
+    assert isinstance(arg, fsnative)
+
+    text = fsn2text(arg, strict=True)
+    if PY2:
+        return text.encode("ascii")
+    else:
+        return text.encode("ascii").decode("ascii")
+
+
+def value_from_fsnative(arg, escape):
+    """Takes an item from argv and returns a text_type value without
+    surrogate escapes or raises ValueError.
+    """
+
+    assert isinstance(arg, fsnative)
+
+    if escape:
+        bytes_ = fsn2bytes(arg, "utf-8")
+        if PY2:
+            bytes_ = bytes_.decode("string_escape")
+        else:
+            bytes_ = codecs.escape_decode(bytes_)[0]
+        arg = bytes2fsn(bytes_, "utf-8")
+
+    text = fsn2text(arg, strict=True)
+    return text
+
+
+def error(*args):
+    print_(*args, file=sys.stderr)
+    raise SystemExit(1)
+
+
+def get_frame_encoding(frame_id, value):
+    if frame_id == "APIC":
+        # See https://github.com/beetbox/beets/issues/899#issuecomment-62437773
+        return Encoding.UTF16 if value else Encoding.LATIN1
+    else:
+        return Encoding.UTF8
+
+
+def write_files(edits, filenames, escape):
+    # unescape escape sequences and decode values
+    encoded_edits = []
+    for frame, value in edits:
+        if not value:
+            continue
+
+        try:
+            frame = frame_from_fsnative(frame)
+        except ValueError as err:
+            print_(text_type(err), file=sys.stderr)
+
+        assert isinstance(frame, str)
+
+        # strip "--"
+        frame = frame[2:]
+
+        try:
+            value = value_from_fsnative(value, escape)
+        except ValueError as err:
+            error(u"%s: %s" % (frame, text_type(err)))
+
+        assert isinstance(value, text_type)
+
+        encoded_edits.append((frame, value))
+    edits = encoded_edits
+
+    # preprocess:
+    #   for all [frame,value] pairs in the edits list
+    #      gather values for identical frames into a list
+    tmp = {}
+    for frame, value in edits:
+        if frame in tmp:
+            tmp[frame].append(value)
+        else:
+            tmp[frame] = [value]
+    # edits is now a dictionary of frame -> [list of values]
+    edits = tmp
+
+    # escape also enables escaping of the split separator
+    if escape:
+        string_split = split_escape
+    else:
+        string_split = lambda s, *args, **kwargs: s.split(*args, **kwargs)
+
+    for filename in filenames:
+        with _sig.block():
+            if verbose:
+                print_(u"Writing", filename, file=sys.stderr)
+            try:
+                id3 = mutagen.id3.ID3(filename)
+            except mutagen.id3.ID3NoHeaderError:
+                if verbose:
+                    print_(u"No ID3 header found; creating a new tag",
+                          file=sys.stderr)
+                id3 = mutagen.id3.ID3()
+            except Exception as err:
+                print_(str(err), file=sys.stderr)
+                continue
+            for (frame, vlist) in edits.items():
+                if frame == "POPM":
+                    for value in vlist:
+                        values = string_split(value, ":")
+                        if len(values) == 1:
+                            email, rating, count = values[0], 0, 0
+                        elif len(values) == 2:
+                            email, rating, count = values[0], values[1], 0
+                        else:
+                            email, rating, count = values
+
+                        frame = mutagen.id3.POPM(
+                            email=email, rating=int(rating), count=int(count))
+                        id3.add(frame)
+                elif frame == "APIC":
+                    for value in vlist:
+                        values = string_split(value, ":")
+                        # FIXME: doesn't support filenames with an invalid
+                        # encoding since we have already decoded at that point
+                        fn = values[0]
+
+                        if len(values) >= 2:
+                            desc = values[1]
+                        else:
+                            desc = u"cover"
+
+                        if len(values) >= 3:
+                            try:
+                                picture_type = int(values[2])
+                            except ValueError:
+                                error(u"Invalid picture type: %r" % values[1])
+                        else:
+                            picture_type = PictureType.COVER_FRONT
+
+                        if len(values) >= 4:
+                            mime = values[3]
+                        else:
+                            mime = mimetypes.guess_type(fn)[0] or "image/jpeg"
+
+                        if len(values) >= 5:
+                            error("APIC: Invalid format")
+
+                        encoding = get_frame_encoding(frame, desc)
+
+                        try:
+                            with open(fn, "rb") as h:
+                                data = h.read()
+                        except IOError as e:
+                            error(text_type(e))
+
+                        frame = mutagen.id3.APIC(encoding=encoding, mime=mime,
+                            desc=desc, type=picture_type, data=data)
+
+                        id3.add(frame)
+                elif frame == "COMM":
+                    for value in vlist:
+                        values = string_split(value, ":")
+                        if len(values) == 1:
+                            value, desc, lang = values[0], "", "eng"
+                        elif len(values) == 2:
+                            desc, value, lang = values[0], values[1], "eng"
+                        else:
+                            value = ":".join(values[1:-1])
+                            desc, lang = values[0], values[-1]
+                        frame = mutagen.id3.COMM(
+                            encoding=3, text=value, lang=lang, desc=desc)
+                        id3.add(frame)
+                elif frame == "UFID":
+                    for value in vlist:
+                        values = string_split(value, ":")
+                        if len(values) != 2:
+                            error(u"Invalid value: %r" % values)
+                        owner = values[0]
+                        data = values[1].encode("utf-8")
+                        frame = mutagen.id3.UFID(owner=owner, data=data)
+                        id3.add(frame)
+                elif frame == "TXXX":
+                    for value in vlist:
+                        values = string_split(value, ":", 1)
+                        if len(values) == 1:
+                            desc, value = "", values[0]
+                        else:
+                            desc, value = values[0], values[1]
+                        frame = mutagen.id3.TXXX(
+                            encoding=3, text=value, desc=desc)
+                        id3.add(frame)
+                elif issubclass(mutagen.id3.Frames[frame],
+                                mutagen.id3.UrlFrame):
+                    frame = mutagen.id3.Frames[frame](encoding=3, url=vlist)
+                    id3.add(frame)
+                else:
+                    frame = mutagen.id3.Frames[frame](encoding=3, text=vlist)
+                    id3.add(frame)
+            id3.save(filename)
+
+
+def list_tags(filenames):
+    for filename in filenames:
+        print_("IDv2 tag info for", filename)
+        try:
+            id3 = mutagen.id3.ID3(filename, translate=False)
+        except mutagen.id3.ID3NoHeaderError:
+            print_(u"No ID3 header found; skipping.")
+        except Exception as err:
+            print_(text_type(err), file=sys.stderr)
+            raise SystemExit(1)
+        else:
+            print_(id3.pprint())
+
+
+def list_tags_raw(filenames):
+    for filename in filenames:
+        print_("Raw IDv2 tag info for", filename)
+        try:
+            id3 = mutagen.id3.ID3(filename, translate=False)
+        except mutagen.id3.ID3NoHeaderError:
+            print_(u"No ID3 header found; skipping.")
+        except Exception as err:
+            print_(text_type(err), file=sys.stderr)
+            raise SystemExit(1)
+        else:
+            for frame in id3.values():
+                print_(text_type(repr(frame)))
+
+
+def main(argv):
+    parser = ID3OptionParser()
+    parser.add_option(
+        "-v", "--verbose", action="store_true", dest="verbose", default=False,
+        help="be verbose")
+    parser.add_option(
+        "-q", "--quiet", action="store_false", dest="verbose",
+        help="be quiet (the default)")
+    parser.add_option(
+        "-e", "--escape", action="store_true", default=False,
+        help="enable interpretation of backslash escapes")
+    parser.add_option(
+        "-f", "--list-frames", action="callback", callback=list_frames,
+        help="Display all possible frames for ID3v2.3 / ID3v2.4")
+    parser.add_option(
+        "--list-frames-v2.2", action="callback", callback=list_frames_2_2,
+        help="Display all possible frames for ID3v2.2")
+    parser.add_option(
+        "-L", "--list-genres", action="callback", callback=list_genres,
+        help="Lists all ID3v1 genres")
+    parser.add_option(
+        "-l", "--list", action="store_const", dest="action", const="list",
+        help="Lists the tag(s) on the open(s)")
+    parser.add_option(
+        "--list-raw", action="store_const", dest="action", const="list-raw",
+        help="Lists the tag(s) on the open(s) in Python format")
+    parser.add_option(
+        "-d", "--delete-v2", action="store_const", dest="action",
+        const="delete-v2", help="Deletes ID3v2 tags")
+    parser.add_option(
+        "-s", "--delete-v1", action="store_const", dest="action",
+        const="delete-v1", help="Deletes ID3v1 tags")
+    parser.add_option(
+        "-D", "--delete-all", action="store_const", dest="action",
+        const="delete-v1-v2", help="Deletes ID3v1 and ID3v2 tags")
+    parser.add_option(
+        '--delete-frames', metavar='FID1,FID2,...', action='store',
+        dest='deletes', default='', help="Delete the given frames")
+    parser.add_option(
+        "-C", "--convert", action="store_const", dest="action",
+        const="convert",
+        help="Convert tags to ID3v2.4 (any editing will do this)")
+
+    parser.add_option(
+        "-a", "--artist", metavar='"ARTIST"', action="callback",
+        help="Set the artist information", type="string",
+        callback=lambda *args: args[3].edits.append((fsnative(u"--TPE1"),
+                                                     args[2])))
+    parser.add_option(
+        "-A", "--album", metavar='"ALBUM"', action="callback",
+        help="Set the album title information", type="string",
+        callback=lambda *args: args[3].edits.append((fsnative(u"--TALB"),
+                                                     args[2])))
+    parser.add_option(
+        "-t", "--song", metavar='"SONG"', action="callback",
+        help="Set the song title information", type="string",
+        callback=lambda *args: args[3].edits.append((fsnative(u"--TIT2"),
+                                                     args[2])))
+    parser.add_option(
+        "-c", "--comment", metavar='"DESCRIPTION":"COMMENT":"LANGUAGE"',
+        action="callback", help="Set the comment information", type="string",
+        callback=lambda *args: args[3].edits.append((fsnative(u"--COMM"),
+                                                     args[2])))
+    parser.add_option(
+        "-p", "--picture",
+        metavar='"FILENAME":"DESCRIPTION":"IMAGE-TYPE":"MIME-TYPE"',
+        action="callback", help="Set the picture", type="string",
+        callback=lambda *args: args[3].edits.append((fsnative(u"--APIC"),
+                                                     args[2])))
+    parser.add_option(
+        "-g", "--genre", metavar='"GENRE"', action="callback",
+        help="Set the genre or genre number", type="string",
+        callback=lambda *args: args[3].edits.append((fsnative(u"--TCON"),
+                                                     args[2])))
+    parser.add_option(
+        "-y", "--year", "--date", metavar='YYYY[-MM-DD]', action="callback",
+        help="Set the year/date", type="string",
+        callback=lambda *args: args[3].edits.append((fsnative(u"--TDRC"),
+                                                     args[2])))
+    parser.add_option(
+        "-T", "--track", metavar='"num/num"', action="callback",
+        help="Set the track number/(optional) total tracks", type="string",
+        callback=lambda *args: args[3].edits.append((fsnative(u"--TRCK"),
+                                                     args[2])))
+
+    for key, frame in mutagen.id3.Frames.items():
+        if (issubclass(frame, mutagen.id3.TextFrame)
+                or issubclass(frame, mutagen.id3.UrlFrame)
+                or issubclass(frame, mutagen.id3.POPM)
+                or frame in (mutagen.id3.APIC, mutagen.id3.UFID)):
+            parser.add_option(
+                "--" + key, action="callback", help=SUPPRESS_HELP,
+                type='string', metavar="value",  # optparse blows up with this
+                callback=lambda *args: args[3].edits.append(args[1:3]))
+
+    (options, args) = parser.parse_args(argv[1:])
+    global verbose
+    verbose = options.verbose
+
+    if args:
+        if parser.edits or options.deletes:
+            if options.deletes:
+                delete_frames(options.deletes, args)
+            if parser.edits:
+                write_files(parser.edits, args, options.escape)
+        elif options.action in [None, 'list']:
+            list_tags(args)
+        elif options.action == "list-raw":
+            list_tags_raw(args)
+        elif options.action == "convert":
+            write_files([], args, options.escape)
+        elif options.action.startswith("delete"):
+            delete_tags(args, "v1" in options.action, "v2" in options.action)
+        else:
+            parser.print_help()
+    else:
+        parser.print_help()
+
+
+def entry_point():
+    _sig.init()
+    return main(argv)
@@ -0,0 +1,75 @@
+# -*- coding: utf-8 -*-
+# Copyright 2006 Joe Wreschnig
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+
+"""Split a multiplex/chained Ogg file into its component parts."""
+
+import os
+
+import mutagen.ogg
+from mutagen._senf import argv
+
+from ._util import SignalHandler, OptionParser
+
+
+_sig = SignalHandler()
+
+
+def main(argv):
+    from mutagen.ogg import OggPage
+    parser = OptionParser(
+        usage="%prog [options] filename.ogg ...",
+        description="Split Ogg logical streams using Mutagen.",
+        version="Mutagen %s" % ".".join(map(str, mutagen.version))
+    )
+
+    parser.add_option(
+        "--extension", dest="extension", default="ogg", metavar='ext',
+        help="use this extension (default 'ogg')")
+    parser.add_option(
+        "--pattern", dest="pattern", default="%(base)s-%(stream)d.%(ext)s",
+        metavar='pattern', help="name files using this pattern")
+    parser.add_option(
+        "--m3u", dest="m3u", action="store_true", default=False,
+        help="generate an m3u (playlist) file")
+
+    (options, args) = parser.parse_args(argv[1:])
+    if not args:
+        raise SystemExit(parser.print_help() or 1)
+
+    format = {'ext': options.extension}
+    for filename in args:
+        with _sig.block():
+            fileobjs = {}
+            format["base"] = os.path.splitext(os.path.basename(filename))[0]
+            fileobj = open(filename, "rb")
+            if options.m3u:
+                m3u = open(format["base"] + ".m3u", "w")
+                fileobjs["m3u"] = m3u
+            else:
+                m3u = None
+            while True:
+                try:
+                    page = OggPage(fileobj)
+                except EOFError:
+                    break
+                else:
+                    format["stream"] = page.serial
+                    if page.serial not in fileobjs:
+                        new_filename = options.pattern % format
+                        new_fileobj = open(new_filename, "wb")
+                        fileobjs[page.serial] = new_fileobj
+                        if m3u:
+                            m3u.write(new_filename + "\r\n")
+                    fileobjs[page.serial].write(page.write())
+            for f in fileobjs.values():
+                f.close()
+
+
+def entry_point():
+    _sig.init()
+    return main(argv)
@@ -0,0 +1,45 @@
+# -*- coding: utf-8 -*-
+# Copyright 2005 Joe Wreschnig
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+
+"""Full tag list for any given file."""
+
+from mutagen._senf import print_, argv
+from mutagen._compat import text_type
+
+from ._util import SignalHandler, OptionParser
+
+
+_sig = SignalHandler()
+
+
+def main(argv):
+    from mutagen import File
+
+    parser = OptionParser()
+    parser.add_option("--no-flac", help="Compatibility; does nothing.")
+    parser.add_option("--no-mp3", help="Compatibility; does nothing.")
+    parser.add_option("--no-apev2", help="Compatibility; does nothing.")
+
+    (options, args) = parser.parse_args(argv[1:])
+    if not args:
+        raise SystemExit(parser.print_help() or 1)
+
+    for filename in args:
+        print_(u"--", filename)
+        try:
+            print_(u"-", File(filename).pprint())
+        except AttributeError:
+            print_(u"- Unknown file type")
+        except Exception as err:
+            print_(text_type(err))
+        print_(u"")
+
+
+def entry_point():
+    _sig.init()
+    return main(argv)
@@ -0,0 +1,116 @@
+# -*- coding: utf-8 -*-
+# Copyright 2005 Joe Wreschnig, Michael Urman
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+
+import os
+import sys
+import traceback
+
+from mutagen._senf import print_, argv
+
+from ._util import SignalHandler
+
+
+class Report(object):
+    def __init__(self, pathname):
+        self.name = pathname
+        self.files = 0
+        self.unsync = 0
+        self.missings = 0
+        self.errors = []
+        self.exceptions = {}
+        self.versions = {}
+
+    def missing(self, filename):
+        self.missings += 1
+        self.files += 1
+
+    def error(self, filename):
+        Ex, value, trace = sys.exc_info()
+        self.exceptions.setdefault(Ex, 0)
+        self.exceptions[Ex] += 1
+        self.errors.append((filename, Ex, value, trace))
+        self.files += 1
+
+    def success(self, id3):
+        self.versions.setdefault(id3.version, 0)
+        self.versions[id3.version] += 1
+        self.files += 1
+        if id3.f_unsynch:
+            self.unsync += 1
+
+    def __str__(self):
+        strings = ["-- Report for %s --" % self.name]
+        if self.files == 0:
+            return strings[0] + "\n" + "No MP3 files found.\n"
+
+        good = self.files - len(self.errors)
+        strings.append("Loaded %d/%d files (%d%%)" % (
+            good, self.files, (float(good) / self.files) * 100))
+        strings.append("%d files with unsynchronized frames." % self.unsync)
+        strings.append("%d files without tags." % self.missings)
+
+        strings.append("\nID3 Versions:")
+        items = list(self.versions.items())
+        items.sort()
+        for v, i in items:
+            strings.append("  %s\t%d" % (".".join(map(str, v)), i))
+
+        if self.exceptions:
+            strings.append("\nExceptions:")
+            items = list(self.exceptions.items())
+            items.sort()
+            for Ex, i in items:
+                strings.append("  %-20s\t%d" % (Ex.__name__, i))
+
+        if self.errors:
+            strings.append("\nERRORS:\n")
+            for filename, Ex, value, trace in self.errors:
+                strings.append("\nReading %s:" % filename)
+                strings.append(
+                    "".join(traceback.format_exception(Ex, value, trace)[1:]))
+        else:
+            strings.append("\nNo errors!")
+
+        return("\n".join(strings))
+
+
+def check_dir(path):
+    from mutagen.mp3 import MP3
+
+    rep = Report(path)
+    print_(u"Scanning", path)
+    for path, dirs, files in os.walk(path):
+        files.sort()
+        for fn in files:
+            if not fn.lower().endswith('.mp3'):
+                continue
+            ffn = os.path.join(path, fn)
+            try:
+                mp3 = MP3(ffn)
+            except Exception:
+                rep.error(ffn)
+            else:
+                if mp3.tags is None:
+                    rep.missing(ffn)
+                else:
+                    rep.success(mp3.tags)
+
+    print_(str(rep))
+
+
+def main(argv):
+    if len(argv) == 1:
+        print_(u"Usage:", argv[0], u"directory ...")
+    else:
+        for path in argv[1:]:
+            check_dir(path)
+
+
+def entry_point():
+    SignalHandler().init()
+    return main(argv)
@@ -1,10 +1,10 @@
 # -*- coding: utf-8 -*-
-
 # Copyright (C) 2006  Joe Wreschnig
 #
 # This program is free software; you can redistribute it and/or modify
-# it under the terms of the GNU General Public License version 2 as
-# published by the Free Software Foundation.
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.

 """Utility classes for Mutagen.

@@ -12,13 +12,224 @@ You should not rely on the interfaces here being stable. They are
 intended for internal use in Mutagen only.
 """

+import sys
 import struct
 import codecs
+import errno

+try:
+    import mmap
+except ImportError:
+    # Google App Engine has no mmap:
+    #   https://github.com/quodlibet/mutagen/issues/286
+    mmap = None
+
+from collections import namedtuple
+from contextlib import contextmanager
+from functools import wraps
 from fnmatch import fnmatchcase

-from ._compat import chr_, text_type, PY2, iteritems, iterbytes, \
-    integer_types, xrange
+from ._compat import chr_, PY2, iteritems, iterbytes, integer_types, xrange, \
+    izip, text_type, reraise
+
+
+def is_fileobj(fileobj):
+    """Returns:
+        bool: if an argument passed ot mutagen should be treated as a
+            file object
+    """
+
+    # open() only handles str/bytes, so we can be strict
+    return not isinstance(fileobj, (text_type, bytes))
+
+
+def verify_fileobj(fileobj, writable=False):
+    """Verifies that the passed fileobj is a file like object which
+    we can use.
+
+    Args:
+        writable (bool): verify that the file object is writable as well
+
+    Raises:
+        ValueError: In case the object is not a file object that is readable
+            (or writable if required) or is not opened in bytes mode.
+    """
+
+    try:
+        data = fileobj.read(0)
+    except Exception:
+        if not hasattr(fileobj, "read"):
+            raise ValueError("%r not a valid file object" % fileobj)
+        raise ValueError("Can't read from file object %r" % fileobj)
+
+    if not isinstance(data, bytes):
+        raise ValueError(
+            "file object %r not opened in binary mode" % fileobj)
+
+    if writable:
+        try:
+            fileobj.write(b"")
+        except Exception:
+            if not hasattr(fileobj, "write"):
+                raise ValueError("%r not a valid file object" % fileobj)
+            raise ValueError("Can't write to file object %r" % fileobj)
+
+
+def verify_filename(filename):
+    """Checks of the passed in filename has the correct type.
+
+    Raises:
+        ValueError: if not a filename
+    """
+
+    if is_fileobj(filename):
+        raise ValueError("%r not a filename" % filename)
+
+
+def fileobj_name(fileobj):
+    """
+    Returns:
+        text: A potential filename for a file object. Always a valid
+            path type, but might be empty or non-existent.
+    """
+
+    value = getattr(fileobj, "name", u"")
+    if not isinstance(value, (text_type, bytes)):
+        value = text_type(value)
+    return value
+
+
+def loadfile(method=True, writable=False, create=False):
+    """A decorator for functions taking a `filething` as a first argument.
+
+    Passes a FileThing instance as the first argument to the wrapped function.
+
+    Args:
+        method (bool): If the wrapped functions is a method
+        writable (bool): If a filename is passed opens the file readwrite, if
+            passed a file object verifies that it is writable.
+        create (bool): If passed a filename that does not exist will create
+            a new empty file.
+    """
+
+    def convert_file_args(args, kwargs):
+        filething = args[0] if args else None
+        filename = kwargs.pop("filename", None)
+        fileobj = kwargs.pop("fileobj", None)
+        return filething, filename, fileobj, args[1:], kwargs
+
+    def wrap(func):
+
+        @wraps(func)
+        def wrapper(self, *args, **kwargs):
+            filething, filename, fileobj, args, kwargs = \
+                convert_file_args(args, kwargs)
+            with _openfile(self, filething, filename, fileobj,
+                           writable, create) as h:
+                return func(self, h, *args, **kwargs)
+
+        @wraps(func)
+        def wrapper_func(*args, **kwargs):
+            filething, filename, fileobj, args, kwargs = \
+                convert_file_args(args, kwargs)
+            with _openfile(None, filething, filename, fileobj,
+                           writable, create) as h:
+                return func(h, *args, **kwargs)
+
+        return wrapper if method else wrapper_func
+
+    return wrap
+
+
+def convert_error(exc_src, exc_dest):
+    """A decorator for reraising exceptions with a different type.
+    Mostly useful for IOError.
+
+    Args:
+        exc_src (type): The source exception type
+        exc_dest (type): The target exception type.
+    """
+
+    def wrap(func):
+
+        @wraps(func)
+        def wrapper(*args, **kwargs):
+            try:
+                return func(*args, **kwargs)
+            except exc_dest:
+                raise
+            except exc_src as err:
+                reraise(exc_dest, err, sys.exc_info()[2])
+
+        return wrapper
+
+    return wrap
+
+
+FileThing = namedtuple("FileThing", ["fileobj", "filename", "name"])
+"""filename is None if the source is not a filename. name is a filename which
+can be used for file type detection
+"""
+
+
+@contextmanager
+def _openfile(instance, filething, filename, fileobj, writable, create):
+    """yields a FileThing
+
+    Args:
+        filething: Either a file name, a file object or None
+        filename: Either a file name or None
+        fileobj: Either a file object or None
+        writable (bool): if the file should be opened
+        create (bool): if the file should be created if it doesn't exist.
+            implies writable
+    Raises:
+        MutagenError: In case opening the file failed
+        TypeError: in case neither a file name or a file object is passed
+    """
+
+    assert not create or writable
+
+    # to allow stacked context managers, just pass the result through
+    if isinstance(filething, FileThing):
+        filename = filething.filename
+        fileobj = filething.fileobj
+        filething = None
+
+    if filething is not None:
+        if is_fileobj(filething):
+            fileobj = filething
+        else:
+            filename = filething
+
+    if instance is not None:
+        # XXX: take "not writable" as loading the file..
+        if not writable:
+            instance.filename = filename
+        elif filename is None:
+            filename = getattr(instance, "filename", None)
+
+    if fileobj is not None:
+        verify_fileobj(fileobj, writable=writable)
+        yield FileThing(fileobj, filename, filename or fileobj_name(fileobj))
+    elif filename is not None:
+        verify_filename(filename)
+        try:
+            fileobj = open(filename, "rb+" if writable else "rb")
+        except IOError as e:
+            if create and e.errno == errno.ENOENT:
+                assert writable
+                try:
+                    fileobj = open(filename, "wb+")
+                except IOError as e2:
+                    raise MutagenError(e2)
+            else:
+                raise MutagenError(e)
+
+        with fileobj as fileobj:
+            yield FileThing(fileobj, filename, filename)
+    else:
+        raise TypeError("Missing filename or fileobj argument")


 class MutagenError(Exception):
@@ -27,8 +238,15 @@ class MutagenError(Exception):
    .. versionadded:: 1.25
    """

+    __module__ = "mutagen"
+

 def total_ordering(cls):
+    """Adds all possible ordering methods to a class.
+
+    Needs a working __eq__ and __lt__ and will supply the rest.
+    """
+
    assert "__eq__" in cls.__dict__
    assert "__lt__" in cls.__dict__

@@ -58,6 +276,25 @@ def hashable(cls):


 def enum(cls):
+    """A decorator for creating an int enum class.
+
+    Makes the values a subclass of the type and implements repr/str.
+    The new class will be a subclass of int.
+
+    Args:
+        cls (type): The class to convert to an enum
+
+    Returns:
+        type: A new class
+
+    ::
+
+        @enum
+        class Foo(object):
+            FOO = 1
+            BAR = 2
+    """
+
    assert cls.__bases__ == (object,)

    d = dict(cls.__dict__)
@@ -71,13 +308,72 @@ def enum(cls):
            setattr(new_type, key, value_instance)
            map_[value] = key

-    def repr_(self):
+    def str_(self):
        if self in map_:
            return "%s.%s" % (type(self).__name__, map_[self])
-        else:
-            return "%s(%s)" % (type(self).__name__, self)
+        return "%d" % int(self)
+
+    def repr_(self):
+        if self in map_:
+            return "<%s.%s: %d>" % (type(self).__name__, map_[self], int(self))
+        return "%d" % int(self)

    setattr(new_type, "__repr__", repr_)
+    setattr(new_type, "__str__", str_)
+
+    return new_type
+
+
+def flags(cls):
+    """A decorator for creating an int flags class.
+
+    Makes the values a subclass of the type and implements repr/str.
+    The new class will be a subclass of int.
+
+    Args:
+        cls (type): The class to convert to an flags
+
+    Returns:
+        type: A new class
+
+    ::
+
+        @flags
+        class Foo(object):
+            FOO = 1
+            BAR = 2
+    """
+
+    assert cls.__bases__ == (object,)
+
+    d = dict(cls.__dict__)
+    new_type = type(cls.__name__, (int,), d)
+    new_type.__module__ = cls.__module__
+
+    map_ = {}
+    for key, value in iteritems(d):
+        if key.upper() == key and isinstance(value, integer_types):
+            value_instance = new_type(value)
+            setattr(new_type, key, value_instance)
+            map_[value] = key
+
+    def str_(self):
+        value = int(self)
+        matches = []
+        for k, v in map_.items():
+            if value & k:
+                matches.append("%s.%s" % (type(self).__name__, v))
+                value &= ~k
+        if value != 0 or not matches:
+            matches.append(text_type(value))
+
+        return " | ".join(matches)
+
+    def repr_(self):
+        return "<%s: %d>" % (str(self), int(self))
+
+    setattr(new_type, "__repr__", repr_)
+    setattr(new_type, "__str__", str_)

    return new_type

@@ -124,7 +420,7 @@ class DictMixin(object):
        itervalues = lambda self: iter(self.values())

    def items(self):
-        return list(zip(self.keys(), self.values()))
+        return list(izip(self.keys(), self.values()))

    if PY2:
        iteritems = lambda s: iter(s.items())
@@ -237,6 +533,19 @@ def _fill_cdata(cls):
                if s.size == 1:
                    esuffix = ""
                bits = str(s.size * 8)
+
+                if unsigned:
+                    max_ = 2 ** (s.size * 8) - 1
+                    min_ = 0
+                else:
+                    max_ = 2 ** (s.size * 8 - 1) - 1
+                    min_ = - 2 ** (s.size * 8 - 1)
+
+                funcs["%s%s_min" % (prefix, name)] = min_
+                funcs["%s%s_max" % (prefix, name)] = max_
+                funcs["%sint%s_min" % (prefix, bits)] = min_
+                funcs["%sint%s_max" % (prefix, bits)] = max_
+
                funcs["%s%s%s" % (prefix, name, esuffix)] = unpack
                funcs["%sint%s%s" % (prefix, bits, esuffix)] = unpack
                funcs["%s%s%s_from" % (prefix, name, esuffix)] = unpack_from
@@ -259,8 +568,8 @@ class cdata(object):
    error = error

    bitswap = b''.join(
-        chr_(sum(((val >> i) & 1) << (7 - i) for i in range(8)))
-        for val in range(256))
+        chr_(sum(((val >> i) & 1) << (7 - i) for i in xrange(8)))
+        for val in xrange(256))

    test_bit = staticmethod(lambda value, n: bool((value >> n) & 1))

@@ -268,45 +577,210 @@ class cdata(object):
 _fill_cdata(cdata)


-def lock(fileobj):
-    """Lock a file object 'safely'.
+def get_size(fileobj):
+    """Returns the size of the file.
+    The position when passed in will be preserved if no error occurs.

-    That means a failure to lock because the platform doesn't
-    support fcntl or filesystem locks is not considered a
-    failure. This call does block.
-
-    Returns whether or not the lock was successful, or
-    raises an exception in more extreme circumstances (full
-    lock table, invalid file).
+    Args:
+        fileobj (fileobj)
+    Returns:
+        int: The size of the file
+    Raises:
+        IOError
    """

+    old_pos = fileobj.tell()
+    try:
+        fileobj.seek(0, 2)
+        return fileobj.tell()
+    finally:
+        fileobj.seek(old_pos, 0)
+
+
+def read_full(fileobj, size):
+    """Like fileobj.read but raises IOError if no all requested data is
+    returned.
+
+    If you want to distinguish IOError and the EOS case, better handle
+    the error yourself instead of using this.
+
+    Args:
+        fileobj (fileobj)
+        size (int): amount of bytes to read
+    Raises:
+        IOError: In case read fails or not enough data is read
+    """
+
+    if size < 0:
+        raise ValueError("size must not be negative")
+
+    data = fileobj.read(size)
+    if len(data) != size:
+        raise IOError
+    return data
+
+
+def seek_end(fileobj, offset):
+    """Like fileobj.seek(-offset, 2), but will not try to go beyond the start
+
+    Needed since file objects from BytesIO will not raise IOError and
+    file objects from open() will raise IOError if going to a negative offset.
+    To make things easier for custom implementations, instead of allowing
+    both behaviors, we just don't do it.
+
+    Args:
+        fileobj (fileobj)
+        offset (int): how many bytes away from the end backwards to seek to
+
+    Raises:
+        IOError
+    """
+
+    if offset < 0:
+        raise ValueError
+
+    if get_size(fileobj) < offset:
+        fileobj.seek(0, 0)
+    else:
+        fileobj.seek(-offset, 2)
+
+
+def mmap_move(fileobj, dest, src, count):
+    """Mmaps the file object if possible and moves 'count' data
+    from 'src' to 'dest'. All data has to be inside the file size
+    (enlarging the file through this function isn't possible)
+
+    Will adjust the file offset.
+
+    Args:
+        fileobj (fileobj)
+        dest (int): The destination offset
+        src (int): The source offset
+        count (int) The amount of data to move
+    Raises:
+        mmap.error: In case move failed
+        IOError: In case an operation on the fileobj fails
+        ValueError: In case invalid parameters were given
+    """
+
+    assert mmap is not None, "no mmap support"
+
+    if dest < 0 or src < 0 or count < 0:
+        raise ValueError("Invalid parameters")
+
    try:
-        import fcntl
-    except ImportError:
-        return False
-    else:
-        try:
-            fcntl.lockf(fileobj, fcntl.LOCK_EX)
-        except IOError:
-            # FIXME: There's possibly a lot of complicated
-            # logic that needs to go here in case the IOError
-            # is EACCES or EAGAIN.
-            return False
-        else:
-            return True
+        fileno = fileobj.fileno()
+    except (AttributeError, IOError):
+        raise mmap.error(
+            "File object does not expose/support a file descriptor")
+
+    fileobj.seek(0, 2)
+    filesize = fileobj.tell()
+    length = max(dest, src) + count
+
+    if length > filesize:
+        raise ValueError("Not in file size boundary")
+
+    offset = ((min(dest, src) // mmap.ALLOCATIONGRANULARITY) *
+              mmap.ALLOCATIONGRANULARITY)
+    assert dest >= offset
+    assert src >= offset
+    assert offset % mmap.ALLOCATIONGRANULARITY == 0
+
+    # Windows doesn't handle empty mappings, add a fast path here instead
+    if count == 0:
+        return
+
+    # fast path
+    if src == dest:
+        return
+
+    fileobj.flush()
+    file_map = mmap.mmap(fileno, length - offset, offset=offset)
+    try:
+        file_map.move(dest - offset, src - offset, count)
+    finally:
+        file_map.close()


-def unlock(fileobj):
-    """Unlock a file object.
+def resize_file(fobj, diff, BUFFER_SIZE=2 ** 16):
+    """Resize a file by `diff`.

-    Don't call this on a file object unless a call to lock()
-    returned true.
+    New space will be filled with zeros.
+
+    Args:
+        fobj (fileobj)
+        diff (int): amount of size to change
+    Raises:
+        IOError
    """

-    # If this fails there's a mismatched lock/unlock pair,
-    # so we definitely don't want to ignore errors.
-    import fcntl
-    fcntl.lockf(fileobj, fcntl.LOCK_UN)
+    fobj.seek(0, 2)
+    filesize = fobj.tell()
+
+    if diff < 0:
+        if filesize + diff < 0:
+            raise ValueError
+        # truncate flushes internally
+        fobj.truncate(filesize + diff)
+    elif diff > 0:
+        try:
+            while diff:
+                addsize = min(BUFFER_SIZE, diff)
+                fobj.write(b"\x00" * addsize)
+                diff -= addsize
+            fobj.flush()
+        except IOError as e:
+            if e.errno == errno.ENOSPC:
+                # To reduce the chance of corrupt files in case of missing
+                # space try to revert the file expansion back. Of course
+                # in reality every in-file-write can also fail due to COW etc.
+                # Note: IOError gets also raised in flush() due to buffering
+                fobj.truncate(filesize)
+            raise
+
+
+def fallback_move(fobj, dest, src, count, BUFFER_SIZE=2 ** 16):
+    """Moves data around using read()/write().
+
+    Args:
+        fileobj (fileobj)
+        dest (int): The destination offset
+        src (int): The source offset
+        count (int) The amount of data to move
+    Raises:
+        IOError: In case an operation on the fileobj fails
+        ValueError: In case invalid parameters were given
+    """
+
+    if dest < 0 or src < 0 or count < 0:
+        raise ValueError
+
+    fobj.seek(0, 2)
+    filesize = fobj.tell()
+
+    if max(dest, src) + count > filesize:
+        raise ValueError("area outside of file")
+
+    if src > dest:
+        moved = 0
+        while count - moved:
+            this_move = min(BUFFER_SIZE, count - moved)
+            fobj.seek(src + moved)
+            buf = fobj.read(this_move)
+            fobj.seek(dest + moved)
+            fobj.write(buf)
+            moved += this_move
+        fobj.flush()
+    else:
+        while count:
+            this_move = min(BUFFER_SIZE, count)
+            fobj.seek(src + count - this_move)
+            buf = fobj.read(this_move)
+            fobj.seek(count + dest - this_move)
+            fobj.write(buf)
+            count -= this_move
+        fobj.flush()


 def insert_bytes(fobj, size, offset, BUFFER_SIZE=2 ** 16):
@@ -315,60 +789,34 @@ def insert_bytes(fobj, size, offset, BUFFER_SIZE=2 ** 16):
    fobj must be an open file object, open rb+ or
    equivalent. Mutagen tries to use mmap to resize the file, but
    falls back to a significantly slower method if mmap fails.
+
+    Args:
+        fobj (fileobj)
+        size (int): The amount of space to insert
+        offset (int): The offset at which to insert the space
+    Raises:
+        IOError
    """

-    assert 0 < size
-    assert 0 <= offset
-    locked = False
+    if size < 0 or offset < 0:
+        raise ValueError
+
    fobj.seek(0, 2)
    filesize = fobj.tell()
    movesize = filesize - offset
-    fobj.write(b'\x00' * size)
-    fobj.flush()
-    try:
+
+    if movesize < 0:
+        raise ValueError
+
+    resize_file(fobj, size, BUFFER_SIZE)
+
+    if mmap is not None:
        try:
-            import mmap
-            file_map = mmap.mmap(fobj.fileno(), filesize + size)
-            try:
-                file_map.move(offset + size, offset, movesize)
-            finally:
-                file_map.close()
-        except (ValueError, EnvironmentError, ImportError):
-            # handle broken mmap scenarios
-            locked = lock(fobj)
-            fobj.truncate(filesize)
-
-            fobj.seek(0, 2)
-            padsize = size
-            # Don't generate an enormous string if we need to pad
-            # the file out several megs.
-            while padsize:
-                addsize = min(BUFFER_SIZE, padsize)
-                fobj.write(b"\x00" * addsize)
-                padsize -= addsize
-
-            fobj.seek(filesize, 0)
-            while movesize:
-                # At the start of this loop, fobj is pointing at the end
-                # of the data we need to move, which is of movesize length.
-                thismove = min(BUFFER_SIZE, movesize)
-                # Seek back however much we're going to read this frame.
-                fobj.seek(-thismove, 1)
-                nextpos = fobj.tell()
-                # Read it, so we're back at the end.
-                data = fobj.read(thismove)
-                # Seek back to where we need to write it.
-                fobj.seek(-thismove + size, 1)
-                # Write it.
-                fobj.write(data)
-                # And seek back to the end of the unmoved data.
-                fobj.seek(nextpos)
-                movesize -= thismove
-
-            fobj.flush()
-    finally:
-        if locked:
-            unlock(fobj)
+            mmap_move(fobj, offset + size, offset, movesize)
+        except mmap.error:
+            fallback_move(fobj, offset + size, offset, movesize, BUFFER_SIZE)
+    else:
+        fallback_move(fobj, offset + size, offset, movesize, BUFFER_SIZE)


 def delete_bytes(fobj, size, offset, BUFFER_SIZE=2 ** 16):
@@ -377,46 +825,71 @@ def delete_bytes(fobj, size, offset, BUFFER_SIZE=2 ** 16):
    fobj must be an open file object, open rb+ or
    equivalent. Mutagen tries to use mmap to resize the file, but
    falls back to a significantly slower method if mmap fails.
+
+    Args:
+        fobj (fileobj)
+        size (int): The amount of space to delete
+        offset (int): The start of the space to delete
+    Raises:
+        IOError
    """

-    locked = False
-    assert 0 < size
-    assert 0 <= offset
+    if size < 0 or offset < 0:
+        raise ValueError
+
    fobj.seek(0, 2)
    filesize = fobj.tell()
    movesize = filesize - offset - size
-    assert 0 <= movesize
-    try:
-        if movesize > 0:
-            fobj.flush()
-            try:
-                import mmap
-                file_map = mmap.mmap(fobj.fileno(), filesize)
-                try:
-                    file_map.move(offset, offset + size, movesize)
-                finally:
-                    file_map.close()
-            except (ValueError, EnvironmentError, ImportError):
-                # handle broken mmap scenarios
-                locked = lock(fobj)
-                fobj.seek(offset + size)
-                buf = fobj.read(BUFFER_SIZE)
-                while buf:
-                    fobj.seek(offset)
-                    fobj.write(buf)
-                    offset += len(buf)
-                    fobj.seek(offset + size)
-                    buf = fobj.read(BUFFER_SIZE)
-        fobj.truncate(filesize - size)
-        fobj.flush()
-    finally:
-        if locked:
-            unlock(fobj)
+
+    if movesize < 0:
+        raise ValueError
+
+    if mmap is not None:
+        try:
+            mmap_move(fobj, offset, offset + size, movesize)
+        except mmap.error:
+            fallback_move(fobj, offset, offset + size, movesize, BUFFER_SIZE)
+    else:
+        fallback_move(fobj, offset, offset + size, movesize, BUFFER_SIZE)
+
+    resize_file(fobj, -size, BUFFER_SIZE)
+
+
+def resize_bytes(fobj, old_size, new_size, offset):
+    """Resize an area in a file adding and deleting at the end of it.
+    Does nothing if no resizing is needed.
+
+    Args:
+        fobj (fileobj)
+        old_size (int): The area starting at offset
+        new_size (int): The new size of the area
+        offset (int): The start of the area
+    Raises:
+        IOError
+    """
+
+    if new_size < old_size:
+        delete_size = old_size - new_size
+        delete_at = offset + new_size
+        delete_bytes(fobj, delete_size, delete_at)
+    elif new_size > old_size:
+        insert_size = new_size - old_size
+        insert_at = offset + old_size
+        insert_bytes(fobj, insert_size, insert_at)


 def dict_match(d, key, default=None):
    """Like __getitem__ but works as if the keys() are all filename patterns.
    Returns the value of any dict key that matches the passed key.
+
+    Args:
+        d (dict): A dict with filename patterns as keys
+        key (str): A key potentially matching any of the keys
+        default (object): The object to return if no pattern matched the
+            passed in key
+    Returns:
+        object: The dict value where the dict key matched the passed in key.
+            Or default if there was no match.
    """

    if key in d and "[" not in key:
@@ -428,15 +901,57 @@ def dict_match(d, key, default=None):
    return default


+def encode_endian(text, encoding, errors="strict", le=True):
+    """Like text.encode(encoding) but always returns little endian/big endian
+    BOMs instead of the system one.
+
+    Args:
+        text (text)
+        encoding (str)
+        errors (str)
+        le (boolean): if little endian
+    Returns:
+        bytes
+    Raises:
+        UnicodeEncodeError
+        LookupError
+    """
+
+    encoding = codecs.lookup(encoding).name
+
+    if encoding == "utf-16":
+        if le:
+            return codecs.BOM_UTF16_LE + text.encode("utf-16-le", errors)
+        else:
+            return codecs.BOM_UTF16_BE + text.encode("utf-16-be", errors)
+    elif encoding == "utf-32":
+        if le:
+            return codecs.BOM_UTF32_LE + text.encode("utf-32-le", errors)
+        else:
+            return codecs.BOM_UTF32_BE + text.encode("utf-32-be", errors)
+    else:
+        return text.encode(encoding, errors)
+
+
 def decode_terminated(data, encoding, strict=True):
    """Returns the decoded data until the first NULL terminator
    and all data after it.

-    In case the data can't be decoded raises UnicodeError.
-    In case the encoding is not found raises LookupError.
-    In case the data isn't null terminated (even if it is encoded correctly)
-    raises ValueError except if strict is False, then the decoded string
-    will be returned anyway.
+    Args:
+        data (bytes): data to decode
+        encoding (str): The codec to use
+        strict (bool): If True will raise ValueError in case no NULL is found
+            but the available data decoded successfully.
+    Returns:
+        Tuple[`text`, `bytes`]: A tuple containing the decoded text and the
+            remaining data after the found NULL termination.
+
+    Raises:
+        UnicodeError: In case the data can't be decoded.
+        LookupError:In case the encoding is not found.
+        ValueError: In case the data isn't null terminated (even if it is
+            encoded correctly) except if strict is False, then the decoded
+            string will be returned anyway.
    """

    codec_info = codecs.lookup(encoding)
@@ -472,47 +987,6 @@ def decode_terminated(data, encoding, strict=True):
        return u"".join(r), b""


-def split_escape(string, sep, maxsplit=None, escape_char="\\"):
-    """Like unicode/str/bytes.split but allows for the separator to be escaped
-
-    If passed unicode/str/bytes will only return list of unicode/str/bytes.
-    """
-
-    assert len(sep) == 1
-    assert len(escape_char) == 1
-
-    if isinstance(string, bytes):
-        if isinstance(escape_char, text_type):
-            escape_char = escape_char.encode("ascii")
-        iter_ = iterbytes
-    else:
-        iter_ = iter
-
-    if maxsplit is None:
-        maxsplit = len(string)
-
-    empty = string[:0]
-    result = []
-    current = empty
-    escaped = False
-    for char in iter_(string):
-        if escaped:
-            if char != escape_char and char != sep:
-                current += escape_char
-            current += char
-            escaped = False
-        else:
-            if char == escape_char:
-                escaped = True
-            elif char == sep and len(result) < maxsplit:
-                result.append(current)
-                current = empty
-            else:
-                current += char
-    result.append(current)
-    return result
-
-
 class BitReaderError(Exception):
    pass

@@ -1,11 +1,11 @@
 # -*- coding: utf-8 -*-
-
 # Copyright (C) 2005-2006  Joe Wreschnig
 #                    2013  Christoph Reiter
 #
 # This program is free software; you can redistribute it and/or modify
-# it under the terms of version 2 of the GNU General Public License as
-# published by the Free Software Foundation.
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.

 """Read and write Vorbis comment data.

@@ -20,7 +20,7 @@ import sys

 import mutagen
 from ._compat import reraise, BytesIO, text_type, xrange, PY3, PY2
-from mutagen._util import DictMixin, cdata
+from mutagen._util import DictMixin, cdata, MutagenError


 def is_valid_key(key):
@@ -45,7 +45,7 @@ def is_valid_key(key):
 istag = is_valid_key


-class error(IOError):
+class error(MutagenError):
    pass


@@ -57,7 +57,7 @@ class VorbisEncodingError(error):
    pass


-class VComment(mutagen.Metadata, list):
+class VComment(mutagen.Tags, list):
    """A Vorbis comment parser, accessor, and renderer.

    All comment ordering is preserved. A VComment is a list of
@@ -68,13 +68,13 @@ class VComment(mutagen.Metadata, list):
    file-like object, not a filename.

    Attributes:
-
-    * vendor -- the stream 'vendor' (i.e. writer); default 'Mutagen'
+        vendor (text): the stream 'vendor' (i.e. writer); default 'Mutagen'
    """

    vendor = u"Mutagen " + mutagen.version_string

    def __init__(self, data=None, *args, **kwargs):
+        self._size = 0
        # Collect the args to pass to load, this lets child classes
        # override just load and get equivalent magic for the
        # constructor.
@@ -83,17 +83,18 @@ class VComment(mutagen.Metadata, list):
                data = BytesIO(data)
            elif not hasattr(data, 'read'):
                raise TypeError("VComment requires bytes or a file-like")
+            start = data.tell()
            self.load(data, *args, **kwargs)
+            self._size = data.tell() - start

    def load(self, fileobj, errors='replace', framing=True):
        """Parse a Vorbis comment from a file-like object.

-        Keyword arguments:
-
-        * errors:
-            'strict', 'replace', or 'ignore'. This affects Unicode decoding
-            and how other malformed content is interpreted.
-        * framing -- if true, fail if a framing bit is not present
+        Arguments:
+            errors (str): 'strict', 'replace', or 'ignore'.
+                This affects Unicode decoding and how other malformed content
+                is interpreted.
+            framing (bool): if true, fail if a framing bit is not present

        Framing bits are required by the Vorbis comment specification,
        but are not used in FLAC Vorbis comment blocks.
@@ -183,9 +184,8 @@ class VComment(mutagen.Metadata, list):
        Validation is always performed, so calling this function on
        invalid data may raise a ValueError.

-        Keyword arguments:
-
-        * framing -- if true, append a framing bit (see load)
+        Arguments:
+            framing (bool): if true, append a framing bit (see load)
        """

        self.validate()
@@ -2,8 +2,9 @@
 # Copyright (C) 2014 Christoph Reiter
 #
 # This program is free software; you can redistribute it and/or modify
-# it under the terms of version 2 of the GNU General Public License as
-# published by the Free Software Foundation.
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.

 """
 * ADTS - Audio Data Transport Stream
@@ -13,7 +14,9 @@

 from mutagen import StreamInfo
 from mutagen._file import FileType
-from mutagen._util import BitReader, BitReaderError, MutagenError
+from mutagen._util import BitReader, BitReaderError, MutagenError, loadfile, \
+    convert_error
+from mutagen.id3._util import BitPaddedInt
 from mutagen._compat import endswith, xrange


@@ -262,16 +265,16 @@ class AACError(MutagenError):


 class AACInfo(StreamInfo):
-    """AAC stream information.
+    """AACInfo()
+
+    AAC stream information.
+    The length of the stream is just a guess and might not be correct.

    Attributes:
-
-    * channels -- number of audio channels
-    * length -- file length in seconds, as a float
-    * sample_rate -- audio sampling rate in Hz
-    * bitrate -- audio bitrate, in bits per second
-
-    The length of the stream is just a guess and might not be correct.
+        channels (`int`): number of audio channels
+        length (`float`): file length in seconds, as a float
+        sample_rate (`int`): audio sampling rate in Hz
+        bitrate (`int`): audio bitrate, in bits per second
    """

    channels = 0
@@ -279,11 +282,13 @@ class AACInfo(StreamInfo):
    sample_rate = 0
    bitrate = 0

+    @convert_error(IOError, AACError)
    def __init__(self, fileobj):
+        """Raises AACError"""
+
        # skip id3v2 header
        start_offset = 0
        header = fileobj.read(10)
-        from mutagen.id3 import BitPaddedInt
        if header.startswith(b"ID3"):
            size = BitPaddedInt(header[6:])
            start_offset = size + 10
@@ -373,24 +378,34 @@ class AACInfo(StreamInfo):
        self.length = float(s.samples * stream_size) / (s.size * s.frequency)

    def pprint(self):
-        return "AAC (%s), %d Hz, %.2f seconds, %d channel(s), %d bps" % (
+        return u"AAC (%s), %d Hz, %.2f seconds, %d channel(s), %d bps" % (
            self._type, self.sample_rate, self.length, self.channels,
            self.bitrate)


 class AAC(FileType):
-    """Load ADTS or ADIF streams containing AAC.
+    """AAC(filething)
+
+    Arguments:
+        filething (filething)
+
+    Load ADTS or ADIF streams containing AAC.

    Tagging is not supported.
    Use the ID3/APEv2 classes directly instead.
+
+    Attributes:
+        info (`AACInfo`)
    """

    _mimes = ["audio/x-aac"]

-    def load(self, filename):
-        self.filename = filename
-        with open(filename, "rb") as h:
-            self.info = AACInfo(h)
+    @loadfile()
+    def load(self, filething):
+        self.info = AACInfo(filething.fileobj)
+
+    def add_tags(self):
+        raise AACError("doesn't support tags")

    @staticmethod
    def score(filename, fileobj, header):
@@ -1,36 +1,34 @@
 # -*- coding: utf-8 -*-
-
 # Copyright (C) 2014  Evan Purkhiser
 #               2014  Ben Ockmore
 #
 # This program is free software; you can redistribute it and/or modify
-# it under the terms of version 2 of the GNU General Public License as
-# published by the Free Software Foundation.
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.

 """AIFF audio stream information and tags."""

-# NOTE from Ben Ockmore - according to the Py3k migration guidelines, AIFF
-# chunk keys should be unicode in Py3k, and unicode or bytes in Py2k (ASCII).
-# To make this easier, chunk keys should be stored internally as unicode.
-
+import sys
 import struct
 from struct import pack

-from ._compat import endswith, text_type, PY3
+from ._compat import endswith, text_type, reraise
 from mutagen import StreamInfo, FileType

 from mutagen.id3 import ID3
-from mutagen.id3._util import error as ID3Error
-from mutagen._util import insert_bytes, delete_bytes, MutagenError
+from mutagen.id3._util import ID3NoHeaderError, error as ID3Error
+from mutagen._util import resize_bytes, delete_bytes, MutagenError, loadfile, \
+    convert_error

 __all__ = ["AIFF", "Open", "delete"]


-class error(MutagenError, RuntimeError):
+class error(MutagenError):
    pass


-class InvalidChunk(error, IOError):
+class InvalidChunk(error):
    pass


@@ -39,14 +37,7 @@ _HUGE_VAL = 1.79769313486231e+308


 def is_valid_chunk_id(id):
-    if not isinstance(id, text_type):
-        if PY3:
-            raise TypeError("AIFF chunk must be unicode")
-
-        try:
-            id = id.decode('ascii')
-        except UnicodeDecodeError:
-            return False
+    assert isinstance(id, text_type)

    return ((len(id) <= 4) and (min(id) >= u' ') and
            (max(id) <= u'~'))
@@ -85,37 +76,59 @@ class IFFChunk(object):

        self.id, self.data_size = struct.unpack('>4si', header)

-        if not isinstance(self.id, text_type):
+        try:
            self.id = self.id.decode('ascii')
+        except UnicodeDecodeError:
+            raise InvalidChunk()

        if not is_valid_chunk_id(self.id):
            raise InvalidChunk()

        self.size = self.HEADER_SIZE + self.data_size
        self.data_offset = fileobj.tell()
-        self.data = None

    def read(self):
        """Read the chunks data"""
+
        self.__fileobj.seek(self.data_offset)
-        self.data = self.__fileobj.read(self.data_size)
+        return self.__fileobj.read(self.data_size)
+
+    def write(self, data):
+        """Write the chunk data"""
+
+        if len(data) > self.data_size:
+            raise ValueError
+
+        self.__fileobj.seek(self.data_offset)
+        self.__fileobj.write(data)

    def delete(self):
        """Removes the chunk from the file"""
+
        delete_bytes(self.__fileobj, self.size, self.offset)
        if self.parent_chunk is not None:
-            self.parent_chunk.resize(self.parent_chunk.data_size - self.size)
+            self.parent_chunk._update_size(
+                self.parent_chunk.data_size - self.size)

-    def resize(self, data_size):
+    def _update_size(self, data_size):
        """Update the size of the chunk"""
+
        self.__fileobj.seek(self.offset + 4)
        self.__fileobj.write(pack('>I', data_size))
        if self.parent_chunk is not None:
            size_diff = self.data_size - data_size
-            self.parent_chunk.resize(self.parent_chunk.data_size - size_diff)
+            self.parent_chunk._update_size(
+                self.parent_chunk.data_size - size_diff)
        self.data_size = data_size
        self.size = data_size + self.HEADER_SIZE

+    def resize(self, new_data_size):
+        """Resize the file and update the chunk sizes"""
+
+        resize_bytes(
+            self.__fileobj, self.data_size, new_data_size, self.data_offset)
+        self._update_size(new_data_size)
+

 class IFFFile(object):
    """Representation of a IFF file"""
@@ -154,8 +167,7 @@ class IFFFile(object):
    def __contains__(self, id_):
        """Check if the IFF file contains a specific chunk"""

-        if not isinstance(id_, text_type):
-            id_ = id_.decode('ascii')
+        assert isinstance(id_, text_type)

        if not is_valid_chunk_id(id_):
            raise KeyError("AIFF key must be four ASCII characters.")
@@ -165,8 +177,7 @@ class IFFFile(object):
    def __getitem__(self, id_):
        """Get a chunk from the IFF file"""

-        if not isinstance(id_, text_type):
-            id_ = id_.decode('ascii')
+        assert isinstance(id_, text_type)

        if not is_valid_chunk_id(id_):
            raise KeyError("AIFF key must be four ASCII characters.")
@@ -175,13 +186,12 @@ class IFFFile(object):
            return self.__chunks[id_]
        except KeyError:
            raise KeyError(
-                "%r has no %r chunk" % (self.__fileobj.name, id_))
+                "%r has no %r chunk" % (self.__fileobj, id_))

    def __delitem__(self, id_):
        """Remove a chunk from the IFF file"""

-        if not isinstance(id_, text_type):
-            id_ = id_.decode('ascii')
+        assert isinstance(id_, text_type)

        if not is_valid_chunk_id(id_):
            raise KeyError("AIFF key must be four ASCII characters.")
@@ -191,8 +201,7 @@ class IFFFile(object):
    def insert_chunk(self, id_):
        """Insert a new chunk at the end of the IFF file"""

-        if not isinstance(id_, text_type):
-            id_ = id_.decode('ascii')
+        assert isinstance(id_, text_type)

        if not is_valid_chunk_id(id_):
            raise KeyError("AIFF key must be four ASCII characters.")
@@ -201,24 +210,25 @@ class IFFFile(object):
        self.__fileobj.write(pack('>4si', id_.ljust(4).encode('ascii'), 0))
        self.__fileobj.seek(self.__next_offset)
        chunk = IFFChunk(self.__fileobj, self[u'FORM'])
-        self[u'FORM'].resize(self[u'FORM'].data_size + chunk.size)
+        self[u'FORM']._update_size(self[u'FORM'].data_size + chunk.size)

        self.__chunks[id_] = chunk
        self.__next_offset = chunk.offset + chunk.size


 class AIFFInfo(StreamInfo):
-    """AIFF audio stream information.
+    """AIFFInfo()
+
+    AIFF audio stream information.

    Information is parsed from the COMM chunk of the AIFF file

-    Useful attributes:
-
-    * length -- audio length, in seconds
-    * bitrate -- audio bitrate, in bits per second
-    * channels -- The number of audio channels
-    * sample_rate -- audio sample rate, in Hz
-    * sample_size -- The audio sample size
+    Attributes:
+        length (`float`): audio length, in seconds
+        bitrate (`int`): audio bitrate, in bits per second
+        channels (`int`): The number of audio channels
+        sample_rate (`int`): audio sample rate, in Hz
+        sample_size (`int`): The audio sample size
    """

    length = 0
@@ -226,16 +236,21 @@ class AIFFInfo(StreamInfo):
    channels = 0
    sample_rate = 0

+    @convert_error(IOError, error)
    def __init__(self, fileobj):
+        """Raises error"""
+
        iff = IFFFile(fileobj)
        try:
            common_chunk = iff[u'COMM']
        except KeyError as e:
            raise error(str(e))

-        common_chunk.read()
+        data = common_chunk.read()
+        if len(data) < 18:
+            raise error

-        info = struct.unpack('>hLh10s', common_chunk.data[:18])
+        info = struct.unpack('>hLh10s', data[:18])
        channels, frame_count, sample_size, sample_rate = info

        self.sample_rate = int(read_float(sample_rate))
@@ -245,86 +260,78 @@ class AIFFInfo(StreamInfo):
        self.length = frame_count / float(self.sample_rate)

    def pprint(self):
-        return "%d channel AIFF @ %d bps, %s Hz, %.2f seconds" % (
+        return u"%d channel AIFF @ %d bps, %s Hz, %.2f seconds" % (
            self.channels, self.bitrate, self.sample_rate, self.length)


 class _IFFID3(ID3):
    """A AIFF file with ID3v2 tags"""

-    def _load_header(self):
+    def _pre_load_header(self, fileobj):
        try:
-            self._fileobj.seek(IFFFile(self._fileobj)[u'ID3'].data_offset)
+            fileobj.seek(IFFFile(fileobj)[u'ID3'].data_offset)
        except (InvalidChunk, KeyError):
-            raise ID3Error()
-        super(_IFFID3, self)._load_header()
+            raise ID3NoHeaderError("No ID3 chunk")

-    def save(self, filename=None, v2_version=4, v23_sep='/'):
+    @convert_error(IOError, error)
+    @loadfile(writable=True)
+    def save(self, filething, v2_version=4, v23_sep='/', padding=None):
        """Save ID3v2 data to the AIFF file"""

-        framedata = self._prepare_framedata(v2_version, v23_sep)
-        framesize = len(framedata)
+        fileobj = filething.fileobj

-        if filename is None:
-            filename = self.filename
-
-        # Unlike the parent ID3.save method, we won't save to a blank file
-        # since we would have to construct a empty AIFF file
-        fileobj = open(filename, 'rb+')
        iff_file = IFFFile(fileobj)

+        if u'ID3' not in iff_file:
+            iff_file.insert_chunk(u'ID3')
+
+        chunk = iff_file[u'ID3']
+
        try:
-            if u'ID3' not in iff_file:
-                iff_file.insert_chunk(u'ID3')
+            data = self._prepare_data(
+                fileobj, chunk.data_offset, chunk.data_size, v2_version,
+                v23_sep, padding)
+        except ID3Error as e:
+            reraise(error, e, sys.exc_info()[2])

-            chunk = iff_file[u'ID3']
-            fileobj.seek(chunk.data_offset)
+        new_size = len(data)
+        new_size += new_size % 2  # pad byte
+        assert new_size % 2 == 0
+        chunk.resize(new_size)
+        data += (new_size - len(data)) * b'\x00'
+        assert new_size == len(data)
+        chunk.write(data)

-            header = fileobj.read(10)
-            header = self._prepare_id3_header(header, framesize, v2_version)
-            header, new_size, _ = header
-
-            data = header + framedata + (b'\x00' * (new_size - framesize))
-
-            # Include ID3 header size in 'new_size' calculation
-            new_size += 10
-
-            # Expand the chunk if necessary, including pad byte
-            if new_size > chunk.size:
-                insert_at = chunk.offset + chunk.size
-                insert_size = new_size - chunk.size + new_size % 2
-                insert_bytes(fileobj, insert_size, insert_at)
-                chunk.resize(new_size)
-
-            fileobj.seek(chunk.data_offset)
-            fileobj.write(data)
-        finally:
-            fileobj.close()
-
-    def delete(self, filename=None):
+    @loadfile(writable=True)
+    def delete(self, filething):
        """Completely removes the ID3 chunk from the AIFF file"""

-        if filename is None:
-            filename = self.filename
-        delete(filename)
+        delete(filething)
        self.clear()


-def delete(filename):
+@convert_error(IOError, error)
+@loadfile(method=False, writable=True)
+def delete(filething):
    """Completely removes the ID3 chunk from the AIFF file"""

-    with open(filename, "rb+") as file_:
-        try:
-            del IFFFile(file_)[u'ID3']
-        except KeyError:
-            pass
+    try:
+        del IFFFile(filething.fileobj)[u'ID3']
+    except KeyError:
+        pass


 class AIFF(FileType):
-    """An AIFF audio file.
+    """AIFF(filething)

-    :ivar info: :class:`AIFFInfo`
-    :ivar tags: :class:`ID3`
+    An AIFF audio file.
+
+    Arguments:
+        filething (filething)
+
+    Attributes:
+        tags (`mutagen.id3.ID3`)
+        info (`AIFFInfo`)
    """

    _mimes = ["audio/aiff", "audio/x-aiff"]
@@ -343,20 +350,24 @@ class AIFF(FileType):
        else:
            raise error("an ID3 tag already exists")

-    def load(self, filename, **kwargs):
+    @convert_error(IOError, error)
+    @loadfile()
+    def load(self, filething, **kwargs):
        """Load stream and tag information from a file."""
-        self.filename = filename
+
+        fileobj = filething.fileobj

        try:
-            self.tags = _IFFID3(filename, **kwargs)
-        except ID3Error:
+            self.tags = _IFFID3(fileobj, **kwargs)
+        except ID3NoHeaderError:
            self.tags = None
+        except ID3Error as e:
+            raise error(e)
+        else:
+            self.tags.filename = self.filename

-        try:
-            fileobj = open(filename, "rb")
-            self.info = AIFFInfo(fileobj)
-        finally:
-            fileobj.close()
+        fileobj.seek(0, 0)
+        self.info = AIFFInfo(fileobj)


 Open = AIFF
@@ -1,10 +1,10 @@
 # -*- coding: utf-8 -*-
-
 # Copyright (C) 2005  Joe Wreschnig
 #
 # This program is free software; you can redistribute it and/or modify
-# it under the terms of the GNU General Public License version 2 as
-# published by the Free Software Foundation.
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.

 """APEv2 reading and writing.

@@ -37,8 +37,8 @@ from collections import MutableSequence
 from ._compat import (cBytesIO, PY3, text_type, PY2, reraise, swap_to_string,
                      xrange)
 from mutagen import Metadata, FileType, StreamInfo
-from mutagen._util import (DictMixin, cdata, delete_bytes, total_ordering,
-                           MutagenError)
+from mutagen._util import DictMixin, cdata, delete_bytes, total_ordering, \
+    MutagenError, loadfile, convert_error, seek_end, get_size


 def is_valid_apev2_key(key):
@@ -61,26 +61,26 @@ def is_valid_apev2_key(key):
 #  1: Item contains binary information
 #  2: Item is a locator of external stored information [e.g. URL]
 #  3: reserved"
-TEXT, BINARY, EXTERNAL = range(3)
+TEXT, BINARY, EXTERNAL = xrange(3)

 HAS_HEADER = 1 << 31
 HAS_NO_FOOTER = 1 << 30
 IS_HEADER = 1 << 29


-class error(IOError, MutagenError):
+class error(MutagenError):
    pass


-class APENoHeaderError(error, ValueError):
+class APENoHeaderError(error):
    pass


-class APEUnsupportedVersionError(error, ValueError):
+class APEUnsupportedVersionError(error):
    pass


-class APEBadItemError(error, ValueError):
+class APEBadItemError(error):
    pass


@@ -103,6 +103,8 @@ class _APEv2Data(object):
    is_at_start = False

    def __init__(self, fileobj):
+        """Raises IOError and apev2.error"""
+
        self.__find_metadata(fileobj)

        if self.header is None:
@@ -137,6 +139,8 @@ class _APEv2Data(object):

        # Check for an APEv2 tag followed by an ID3v1 tag at the end.
        try:
+            if get_size(fileobj) < 128:
+                raise IOError
            fileobj.seek(-128, 2)
            if fileobj.read(3) == b"TAG":

@@ -173,11 +177,18 @@ class _APEv2Data(object):
            self.header = 0

    def __fill_missing(self, fileobj):
+        """Raises IOError and apev2.error"""
+
        fileobj.seek(self.metadata + 8)
-        self.version = fileobj.read(4)
-        self.size = cdata.uint_le(fileobj.read(4))
-        self.items = cdata.uint_le(fileobj.read(4))
-        self.flags = cdata.uint_le(fileobj.read(4))
+
+        data = fileobj.read(16)
+        if len(data) != 16:
+            raise error
+
+        self.version = data[:4]
+        self.size = cdata.uint32_le(data[4:8])
+        self.items = cdata.uint32_le(data[8:12])
+        self.flags = cdata.uint32_le(data[12:])

        if self.header is not None:
            self.data = self.header + 32
@@ -256,7 +267,9 @@ class _CIDictProxy(DictMixin):


 class APEv2(_CIDictProxy, Metadata):
-    """A file with an APEv2 tag.
+    """APEv2(filething=None)
+
+    A file with an APEv2 tag.

    ID3v1 tags are silently ignored and overwritten.
    """
@@ -269,15 +282,16 @@ class APEv2(_CIDictProxy, Metadata):
        items = sorted(self.items())
        return u"\n".join(u"%s=%s" % (k, v.pprint()) for k, v in items)

-    def load(self, filename):
-        """Load tags from a filename."""
+    @convert_error(IOError, error)
+    @loadfile()
+    def load(self, filething):
+        """Load tags from a filename.
+
+        Raises apev2.error
+        """
+
+        data = _APEv2Data(filething.fileobj)

-        self.filename = filename
-        fileobj = open(filename, "rb")
-        try:
-            data = _APEv2Data(fileobj)
-        finally:
-            fileobj.close()
        if data.tag:
            self.clear()
            self.__parse_tag(data.tag, data.items)
@@ -285,33 +299,45 @@ class APEv2(_CIDictProxy, Metadata):
            raise APENoHeaderError("No APE tag found")

    def __parse_tag(self, tag, count):
+        """Raises IOError and APEBadItemError"""
+
        fileobj = cBytesIO(tag)

        for i in xrange(count):
-            size_data = fileobj.read(4)
+            tag_data = fileobj.read(8)
            # someone writes wrong item counts
-            if not size_data:
+            if not tag_data:
                break
-            size = cdata.uint_le(size_data)
-            flags = cdata.uint_le(fileobj.read(4))
+            if len(tag_data) != 8:
+                raise error
+            size = cdata.uint32_le(tag_data[:4])
+            flags = cdata.uint32_le(tag_data[4:8])

            # Bits 1 and 2 bits are flags, 0-3
            # Bit 0 is read/write flag, ignored
            kind = (flags & 6) >> 1
            if kind == 3:
                raise APEBadItemError("value type must be 0, 1, or 2")
+
            key = value = fileobj.read(1)
+            if not key:
+                raise APEBadItemError
            while key[-1:] != b'\x00' and value:
                value = fileobj.read(1)
+                if not value:
+                    raise APEBadItemError
                key += value
            if key[-1:] == b"\x00":
                key = key[:-1]
+
            if PY3:
                try:
                    key = key.decode("ascii")
                except UnicodeError as err:
                    reraise(APEBadItemError, err, sys.exc_info()[2])
            value = fileobj.read(size)
+            if len(value) != size:
+                raise APEBadItemError

            value = _get_value_type(kind)._new(value)

@@ -391,7 +417,9 @@ class APEv2(_CIDictProxy, Metadata):

        super(APEv2, self).__setitem__(key, value)

-    def save(self, filename=None):
+    @convert_error(IOError, error)
+    @loadfile(writable=True, create=True)
+    def save(self, filething):
        """Save changes to a file.

        If no filename is given, the one most recently loaded is used.
@@ -400,11 +428,8 @@ class APEv2(_CIDictProxy, Metadata):
        a header and a footer.
        """

-        filename = filename or self.filename
-        try:
-            fileobj = open(filename, "r+b")
-        except IOError:
-            fileobj = open(filename, "w+b")
+        fileobj = filething.fileobj
+
        data = _APEv2Data(fileobj)

        if data.is_at_start:
@@ -453,32 +478,41 @@ class APEv2(_CIDictProxy, Metadata):
        footer += b"\0" * 8

        fileobj.write(footer)
-        fileobj.close()

-    def delete(self, filename=None):
+    @convert_error(IOError, error)
+    @loadfile(writable=True)
+    def delete(self, filething):
        """Remove tags from a file."""

-        filename = filename or self.filename
-        fileobj = open(filename, "r+b")
-        try:
-            data = _APEv2Data(fileobj)
-            if data.start is not None and data.size is not None:
-                delete_bytes(fileobj, data.end - data.start, data.start)
-        finally:
-            fileobj.close()
+        fileobj = filething.fileobj
+        data = _APEv2Data(fileobj)
+        if data.start is not None and data.size is not None:
+            delete_bytes(fileobj, data.end - data.start, data.start)
        self.clear()


 Open = APEv2


-def delete(filename):
-    """Remove tags from a file."""
+@convert_error(IOError, error)
+@loadfile(method=False, writable=True)
+def delete(filething):
+    """delete(filething)
+
+    Arguments:
+        filething (filething)
+    Raises:
+        mutagen.MutagenError
+
+    Remove tags from a file.
+    """

    try:
-        APEv2(filename).delete()
+        t = APEv2(filething)
    except APENoHeaderError:
-        pass
+        return
+    filething.fileobj.seek(0)
+    t.delete(filething)


 def _get_value_type(kind):
@@ -679,6 +713,15 @@ class APEExtValue(_APEUtf8Value):


 class APEv2File(FileType):
+    """APEv2File(filething)
+
+    Arguments:
+        filething (filething)
+
+    Attributes:
+        tags (`APEv2`)
+    """
+
    class _Info(StreamInfo):
        length = 0
        bitrate = 0
@@ -690,11 +733,18 @@ class APEv2File(FileType):
        def pprint():
            return u"Unknown format with APEv2 tag."

-    def load(self, filename):
-        self.filename = filename
-        self.info = self._Info(open(filename, "rb"))
+    @loadfile()
+    def load(self, filething):
+        fileobj = filething.fileobj
+
+        self.info = self._Info(fileobj)
        try:
-            self.tags = APEv2(filename)
+            fileobj.seek(0, 0)
+        except IOError as e:
+            raise error(e)
+
+        try:
+            self.tags = APEv2(fileobj)
        except APENoHeaderError:
            self.tags = None

@@ -702,13 +752,13 @@ class APEv2File(FileType):
        if self.tags is None:
            self.tags = APEv2()
        else:
-            raise ValueError("%r already has tags: %r" % (self, self.tags))
+            raise error("%r already has tags: %r" % (self, self.tags))

    @staticmethod
    def score(filename, fileobj, header):
        try:
-            fileobj.seek(-160, 2)
+            seek_end(fileobj, 160)
+            footer = fileobj.read()
        except IOError:
-            fileobj.seek(0)
-        footer = fileobj.read()
+            return -1
        return ((b"APETAGEX" in footer) - header.startswith(b"ID3"))
@@ -1,862 +0,0 @@
-# -*- coding: utf-8 -*-
-
-# Copyright (C) 2005-2006  Joe Wreschnig
-# Copyright (C) 2006-2007  Lukas Lalinsky
-
-#
-# This program is free software; you can redistribute it and/or modify
-# it under the terms of the GNU General Public License version 2 as
-# published by the Free Software Foundation.
-
-"""Read and write ASF (Window Media Audio) files."""
-
-__all__ = ["ASF", "Open"]
-
-import sys
-import struct
-from mutagen import FileType, Metadata, StreamInfo
-from mutagen._util import (insert_bytes, delete_bytes, DictMixin,
-                           total_ordering, MutagenError)
-from ._compat import swap_to_string, text_type, PY2, string_types, reraise, \
-    xrange, long_, PY3
-
-
-class error(IOError, MutagenError):
-    pass
-
-
-class ASFError(error):
-    pass
-
-
-class ASFHeaderError(error):
-    pass
-
-
-class ASFInfo(StreamInfo):
-    """ASF stream information."""
-
-    def __init__(self):
-        self.length = 0.0
-        self.sample_rate = 0
-        self.bitrate = 0
-        self.channels = 0
-
-    def pprint(self):
-        s = "Windows Media Audio %d bps, %s Hz, %d channels, %.2f seconds" % (
-            self.bitrate, self.sample_rate, self.channels, self.length)
-        return s
-
-
-class ASFTags(list, DictMixin, Metadata):
-    """Dictionary containing ASF attributes."""
-
-    def pprint(self):
-        return "\n".join("%s=%s" % (k, v) for k, v in self)
-
-    def __getitem__(self, key):
-        """A list of values for the key.
-
-        This is a copy, so comment['title'].append('a title') will not
-        work.
-
-        """
-
-        # PY3 only
-        if isinstance(key, slice):
-            return list.__getitem__(self, key)
-
-        values = [value for (k, value) in self if k == key]
-        if not values:
-            raise KeyError(key)
-        else:
-            return values
-
-    def __delitem__(self, key):
-        """Delete all values associated with the key."""
-
-        # PY3 only
-        if isinstance(key, slice):
-            return list.__delitem__(self, key)
-
-        to_delete = [x for x in self if x[0] == key]
-        if not to_delete:
-            raise KeyError(key)
-        else:
-            for k in to_delete:
-                self.remove(k)
-
-    def __contains__(self, key):
-        """Return true if the key has any values."""
-        for k, value in self:
-            if k == key:
-                return True
-        else:
-            return False
-
-    def __setitem__(self, key, values):
-        """Set a key's value or values.
-
-        Setting a value overwrites all old ones. The value may be a
-        list of Unicode or UTF-8 strings, or a single Unicode or UTF-8
-        string.
-
-        """
-
-        # PY3 only
-        if isinstance(key, slice):
-            return list.__setitem__(self, key, values)
-
-        if not isinstance(values, list):
-            values = [values]
-
-        to_append = []
-        for value in values:
-            if not isinstance(value, ASFBaseAttribute):
-                if isinstance(value, string_types):
-                    value = ASFUnicodeAttribute(value)
-                elif PY3 and isinstance(value, bytes):
-                    value = ASFByteArrayAttribute(value)
-                elif isinstance(value, bool):
-                    value = ASFBoolAttribute(value)
-                elif isinstance(value, int):
-                    value = ASFDWordAttribute(value)
-                elif isinstance(value, long_):
-                    value = ASFQWordAttribute(value)
-                else:
-                    raise TypeError("Invalid type %r" % type(value))
-            to_append.append((key, value))
-
-        try:
-            del(self[key])
-        except KeyError:
-            pass
-
-        self.extend(to_append)
-
-    def keys(self):
-        """Return all keys in the comment."""
-        return self and set(next(iter(zip(*self))))
-
-    def as_dict(self):
-        """Return a copy of the comment data in a real dict."""
-        d = {}
-        for key, value in self:
-            d.setdefault(key, []).append(value)
-        return d
-
-
-class ASFBaseAttribute(object):
-    """Generic attribute."""
-    TYPE = None
-
-    def __init__(self, value=None, data=None, language=None,
-                 stream=None, **kwargs):
-        self.language = language
-        self.stream = stream
-        if data:
-            self.value = self.parse(data, **kwargs)
-        else:
-            if value is None:
-                # we used to support not passing any args and instead assign
-                # them later, keep that working..
-                self.value = None
-            else:
-                self.value = self._validate(value)
-
-    def _validate(self, value):
-        """Raises TypeError or ValueError in case the user supplied value
-        isn't valid.
-        """
-
-        return value
-
-    def data_size(self):
-        raise NotImplementedError
-
-    def __repr__(self):
-        name = "%s(%r" % (type(self).__name__, self.value)
-        if self.language:
-            name += ", language=%d" % self.language
-        if self.stream:
-            name += ", stream=%d" % self.stream
-        name += ")"
-        return name
-
-    def render(self, name):
-        name = name.encode("utf-16-le") + b"\x00\x00"
-        data = self._render()
-        return (struct.pack("<H", len(name)) + name +
-                struct.pack("<HH", self.TYPE, len(data)) + data)
-
-    def render_m(self, name):
-        name = name.encode("utf-16-le") + b"\x00\x00"
-        if self.TYPE == 2:
-            data = self._render(dword=False)
-        else:
-            data = self._render()
-        return (struct.pack("<HHHHI", 0, self.stream or 0, len(name),
-                            self.TYPE, len(data)) + name + data)
-
-    def render_ml(self, name):
-        name = name.encode("utf-16-le") + b"\x00\x00"
-        if self.TYPE == 2:
-            data = self._render(dword=False)
-        else:
-            data = self._render()
-
-        return (struct.pack("<HHHHI", self.language or 0, self.stream or 0,
-                            len(name), self.TYPE, len(data)) + name + data)
-
-
-@swap_to_string
-@total_ordering
-class ASFUnicodeAttribute(ASFBaseAttribute):
-    """Unicode string attribute."""
-    TYPE = 0x0000
-
-    def parse(self, data):
-        try:
-            return data.decode("utf-16-le").strip("\x00")
-        except UnicodeDecodeError as e:
-            reraise(ASFError, e, sys.exc_info()[2])
-
-    def _validate(self, value):
-        if not isinstance(value, text_type):
-            if PY2:
-                return value.decode("utf-8")
-            else:
-                raise TypeError("%r not str" % value)
-        return value
-
-    def _render(self):
-        return self.value.encode("utf-16-le") + b"\x00\x00"
-
-    def data_size(self):
-        return len(self._render())
-
-    def __bytes__(self):
-        return self.value.encode("utf-16-le")
-
-    def __str__(self):
-        return self.value
-
-    def __eq__(self, other):
-        return text_type(self) == other
-
-    def __lt__(self, other):
-        return text_type(self) < other
-
-    __hash__ = ASFBaseAttribute.__hash__
-
-
-@swap_to_string
-@total_ordering
-class ASFByteArrayAttribute(ASFBaseAttribute):
-    """Byte array attribute."""
-    TYPE = 0x0001
-
-    def parse(self, data):
-        assert isinstance(data, bytes)
-        return data
-
-    def _render(self):
-        assert isinstance(self.value, bytes)
-        return self.value
-
-    def _validate(self, value):
-        if not isinstance(value, bytes):
-            raise TypeError("must be bytes/str: %r" % value)
-        return value
-
-    def data_size(self):
-        return len(self.value)
-
-    def __bytes__(self):
-        return self.value
-
-    def __str__(self):
-        return "[binary data (%d bytes)]" % len(self.value)
-
-    def __eq__(self, other):
-        return self.value == other
-
-    def __lt__(self, other):
-        return self.value < other
-
-    __hash__ = ASFBaseAttribute.__hash__
-
-
-@swap_to_string
-@total_ordering
-class ASFBoolAttribute(ASFBaseAttribute):
-    """Bool attribute."""
-    TYPE = 0x0002
-
-    def parse(self, data, dword=True):
-        if dword:
-            return struct.unpack("<I", data)[0] == 1
-        else:
-            return struct.unpack("<H", data)[0] == 1
-
-    def _render(self, dword=True):
-        if dword:
-            return struct.pack("<I", bool(self.value))
-        else:
-            return struct.pack("<H", bool(self.value))
-
-    def _validate(self, value):
-        return bool(value)
-
-    def data_size(self):
-        return 4
-
-    def __bool__(self):
-        return bool(self.value)
-
-    def __bytes__(self):
-        return text_type(self.value).encode('utf-8')
-
-    def __str__(self):
-        return text_type(self.value)
-
-    def __eq__(self, other):
-        return bool(self.value) == other
-
-    def __lt__(self, other):
-        return bool(self.value) < other
-
-    __hash__ = ASFBaseAttribute.__hash__
-
-
-@swap_to_string
-@total_ordering
-class ASFDWordAttribute(ASFBaseAttribute):
-    """DWORD attribute."""
-    TYPE = 0x0003
-
-    def parse(self, data):
-        return struct.unpack("<L", data)[0]
-
-    def _render(self):
-        return struct.pack("<L", self.value)
-
-    def _validate(self, value):
-        value = int(value)
-        if not 0 <= value <= 2 ** 32 - 1:
-            raise ValueError("Out of range")
-        return value
-
-    def data_size(self):
-        return 4
-
-    def __int__(self):
-        return self.value
-
-    def __bytes__(self):
-        return text_type(self.value).encode('utf-8')
-
-    def __str__(self):
-        return text_type(self.value)
-
-    def __eq__(self, other):
-        return int(self.value) == other
-
-    def __lt__(self, other):
-        return int(self.value) < other
-
-    __hash__ = ASFBaseAttribute.__hash__
-
-
-@swap_to_string
-@total_ordering
-class ASFQWordAttribute(ASFBaseAttribute):
-    """QWORD attribute."""
-    TYPE = 0x0004
-
-    def parse(self, data):
-        return struct.unpack("<Q", data)[0]
-
-    def _render(self):
-        return struct.pack("<Q", self.value)
-
-    def _validate(self, value):
-        value = int(value)
-        if not 0 <= value <= 2 ** 64 - 1:
-            raise ValueError("Out of range")
-        return value
-
-    def data_size(self):
-        return 8
-
-    def __int__(self):
-        return self.value
-
-    def __bytes__(self):
-        return text_type(self.value).encode('utf-8')
-
-    def __str__(self):
-        return text_type(self.value)
-
-    def __eq__(self, other):
-        return int(self.value) == other
-
-    def __lt__(self, other):
-        return int(self.value) < other
-
-    __hash__ = ASFBaseAttribute.__hash__
-
-
-@swap_to_string
-@total_ordering
-class ASFWordAttribute(ASFBaseAttribute):
-    """WORD attribute."""
-    TYPE = 0x0005
-
-    def parse(self, data):
-        return struct.unpack("<H", data)[0]
-
-    def _render(self):
-        return struct.pack("<H", self.value)
-
-    def _validate(self, value):
-        value = int(value)
-        if not 0 <= value <= 2 ** 16 - 1:
-            raise ValueError("Out of range")
-        return value
-
-    def data_size(self):
-        return 2
-
-    def __int__(self):
-        return self.value
-
-    def __bytes__(self):
-        return text_type(self.value).encode('utf-8')
-
-    def __str__(self):
-        return text_type(self.value)
-
-    def __eq__(self, other):
-        return int(self.value) == other
-
-    def __lt__(self, other):
-        return int(self.value) < other
-
-    __hash__ = ASFBaseAttribute.__hash__
-
-
-@swap_to_string
-@total_ordering
-class ASFGUIDAttribute(ASFBaseAttribute):
-    """GUID attribute."""
-    TYPE = 0x0006
-
-    def parse(self, data):
-        assert isinstance(data, bytes)
-        return data
-
-    def _render(self):
-        assert isinstance(self.value, bytes)
-        return self.value
-
-    def _validate(self, value):
-        if not isinstance(value, bytes):
-            raise TypeError("must be bytes/str: %r" % value)
-        return value
-
-    def data_size(self):
-        return len(self.value)
-
-    def __bytes__(self):
-        return self.value
-
-    def __str__(self):
-        return repr(self.value)
-
-    def __eq__(self, other):
-        return self.value == other
-
-    def __lt__(self, other):
-        return self.value < other
-
-    __hash__ = ASFBaseAttribute.__hash__
-
-
-UNICODE = ASFUnicodeAttribute.TYPE
-BYTEARRAY = ASFByteArrayAttribute.TYPE
-BOOL = ASFBoolAttribute.TYPE
-DWORD = ASFDWordAttribute.TYPE
-QWORD = ASFQWordAttribute.TYPE
-WORD = ASFWordAttribute.TYPE
-GUID = ASFGUIDAttribute.TYPE
-
-
-def ASFValue(value, kind, **kwargs):
-    try:
-        attr_type = _attribute_types[kind]
-    except KeyError:
-        raise ValueError("Unknown value type %r" % kind)
-    else:
-        return attr_type(value=value, **kwargs)
-
-
-_attribute_types = {
-    ASFUnicodeAttribute.TYPE: ASFUnicodeAttribute,
-    ASFByteArrayAttribute.TYPE: ASFByteArrayAttribute,
-    ASFBoolAttribute.TYPE: ASFBoolAttribute,
-    ASFDWordAttribute.TYPE: ASFDWordAttribute,
-    ASFQWordAttribute.TYPE: ASFQWordAttribute,
-    ASFWordAttribute.TYPE: ASFWordAttribute,
-    ASFGUIDAttribute.TYPE: ASFGUIDAttribute,
-}
-
-
-class BaseObject(object):
-    """Base ASF object."""
-    GUID = None
-
-    def parse(self, asf, data, fileobj, size):
-        self.data = data
-
-    def render(self, asf):
-        data = self.GUID + struct.pack("<Q", len(self.data) + 24) + self.data
-        return data
-
-
-class UnknownObject(BaseObject):
-    """Unknown ASF object."""
-    def __init__(self, guid):
-        assert isinstance(guid, bytes)
-        self.GUID = guid
-
-
-class HeaderObject(object):
-    """ASF header."""
-    GUID = b"\x30\x26\xB2\x75\x8E\x66\xCF\x11\xA6\xD9\x00\xAA\x00\x62\xCE\x6C"
-
-
-class ContentDescriptionObject(BaseObject):
-    """Content description."""
-    GUID = b"\x33\x26\xB2\x75\x8E\x66\xCF\x11\xA6\xD9\x00\xAA\x00\x62\xCE\x6C"
-
-    NAMES = [
-        u"Title",
-        u"Author",
-        u"Copyright",
-        u"Description",
-        u"Rating",
-    ]
-
-    def parse(self, asf, data, fileobj, size):
-        super(ContentDescriptionObject, self).parse(asf, data, fileobj, size)
-        asf.content_description_obj = self
-        lengths = struct.unpack("<HHHHH", data[:10])
-        texts = []
-        pos = 10
-        for length in lengths:
-            end = pos + length
-            if length > 0:
-                texts.append(data[pos:end].decode("utf-16-le").strip(u"\x00"))
-            else:
-                texts.append(None)
-            pos = end
-
-        for key, value in zip(self.NAMES, texts):
-            if value is not None:
-                value = ASFUnicodeAttribute(value=value)
-                asf._tags.setdefault(self.GUID, []).append((key, value))
-
-    def render(self, asf):
-        def render_text(name):
-            value = asf.to_content_description.get(name)
-            if value is not None:
-                return text_type(value).encode("utf-16-le") + b"\x00\x00"
-            else:
-                return b""
-
-        texts = [render_text(x) for x in self.NAMES]
-        data = struct.pack("<HHHHH", *map(len, texts)) + b"".join(texts)
-        return self.GUID + struct.pack("<Q", 24 + len(data)) + data
-
-
-class ExtendedContentDescriptionObject(BaseObject):
-    """Extended content description."""
-    GUID = b"\x40\xA4\xD0\xD2\x07\xE3\xD2\x11\x97\xF0\x00\xA0\xC9\x5E\xA8\x50"
-
-    def parse(self, asf, data, fileobj, size):
-        super(ExtendedContentDescriptionObject, self).parse(
-            asf, data, fileobj, size)
-        asf.extended_content_description_obj = self
-        num_attributes, = struct.unpack("<H", data[0:2])
-        pos = 2
-        for i in xrange(num_attributes):
-            name_length, = struct.unpack("<H", data[pos:pos + 2])
-            pos += 2
-            name = data[pos:pos + name_length]
-            name = name.decode("utf-16-le").strip("\x00")
-            pos += name_length
-            value_type, value_length = struct.unpack("<HH", data[pos:pos + 4])
-            pos += 4
-            value = data[pos:pos + value_length]
-            pos += value_length
-            attr = _attribute_types[value_type](data=value)
-            asf._tags.setdefault(self.GUID, []).append((name, attr))
-
-    def render(self, asf):
-        attrs = asf.to_extended_content_description.items()
-        data = b"".join(attr.render(name) for (name, attr) in attrs)
-        data = struct.pack("<QH", 26 + len(data), len(attrs)) + data
-        return self.GUID + data
-
-
-class FilePropertiesObject(BaseObject):
-    """File properties."""
-    GUID = b"\xA1\xDC\xAB\x8C\x47\xA9\xCF\x11\x8E\xE4\x00\xC0\x0C\x20\x53\x65"
-
-    def parse(self, asf, data, fileobj, size):
-        super(FilePropertiesObject, self).parse(asf, data, fileobj, size)
-        length, _, preroll = struct.unpack("<QQQ", data[40:64])
-        asf.info.length = (length / 10000000.0) - (preroll / 1000.0)
-
-
-class StreamPropertiesObject(BaseObject):
-    """Stream properties."""
-    GUID = b"\x91\x07\xDC\xB7\xB7\xA9\xCF\x11\x8E\xE6\x00\xC0\x0C\x20\x53\x65"
-
-    def parse(self, asf, data, fileobj, size):
-        super(StreamPropertiesObject, self).parse(asf, data, fileobj, size)
-        channels, sample_rate, bitrate = struct.unpack("<HII", data[56:66])
-        asf.info.channels = channels
-        asf.info.sample_rate = sample_rate
-        asf.info.bitrate = bitrate * 8
-
-
-class HeaderExtensionObject(BaseObject):
-    """Header extension."""
-    GUID = b"\xb5\x03\xbf_.\xa9\xcf\x11\x8e\xe3\x00\xc0\x0c Se"
-
-    def parse(self, asf, data, fileobj, size):
-        super(HeaderExtensionObject, self).parse(asf, data, fileobj, size)
-        asf.header_extension_obj = self
-        datasize, = struct.unpack("<I", data[18:22])
-        datapos = 0
-        self.objects = []
-        while datapos < datasize:
-            guid, size = struct.unpack(
-                "<16sQ", data[22 + datapos:22 + datapos + 24])
-            if guid in _object_types:
-                obj = _object_types[guid]()
-            else:
-                obj = UnknownObject(guid)
-            obj.parse(asf, data[22 + datapos + 24:22 + datapos + size],
-                      fileobj, size)
-            self.objects.append(obj)
-            datapos += size
-
-    def render(self, asf):
-        data = b"".join(obj.render(asf) for obj in self.objects)
-        return (self.GUID + struct.pack("<Q", 24 + 16 + 6 + len(data)) +
-                b"\x11\xD2\xD3\xAB\xBA\xA9\xcf\x11" +
-                b"\x8E\xE6\x00\xC0\x0C\x20\x53\x65" +
-                b"\x06\x00" + struct.pack("<I", len(data)) + data)
-
-
-class MetadataObject(BaseObject):
-    """Metadata description."""
-    GUID = b"\xea\xcb\xf8\xc5\xaf[wH\x84g\xaa\x8cD\xfaL\xca"
-
-    def parse(self, asf, data, fileobj, size):
-        super(MetadataObject, self).parse(asf, data, fileobj, size)
-        asf.metadata_obj = self
-        num_attributes, = struct.unpack("<H", data[0:2])
-        pos = 2
-        for i in xrange(num_attributes):
-            (reserved, stream, name_length, value_type,
-             value_length) = struct.unpack("<HHHHI", data[pos:pos + 12])
-            pos += 12
-            name = data[pos:pos + name_length]
-            name = name.decode("utf-16-le").strip("\x00")
-            pos += name_length
-            value = data[pos:pos + value_length]
-            pos += value_length
-            args = {'data': value, 'stream': stream}
-            if value_type == 2:
-                args['dword'] = False
-            attr = _attribute_types[value_type](**args)
-            asf._tags.setdefault(self.GUID, []).append((name, attr))
-
-    def render(self, asf):
-        attrs = asf.to_metadata.items()
-        data = b"".join([attr.render_m(name) for (name, attr) in attrs])
-        return (self.GUID + struct.pack("<QH", 26 + len(data), len(attrs)) +
-                data)
-
-
-class MetadataLibraryObject(BaseObject):
-    """Metadata library description."""
-    GUID = b"\x94\x1c#D\x98\x94\xd1I\xa1A\x1d\x13NEpT"
-
-    def parse(self, asf, data, fileobj, size):
-        super(MetadataLibraryObject, self).parse(asf, data, fileobj, size)
-        asf.metadata_library_obj = self
-        num_attributes, = struct.unpack("<H", data[0:2])
-        pos = 2
-        for i in xrange(num_attributes):
-            (language, stream, name_length, value_type,
-             value_length) = struct.unpack("<HHHHI", data[pos:pos + 12])
-            pos += 12
-            name = data[pos:pos + name_length]
-            name = name.decode("utf-16-le").strip("\x00")
-            pos += name_length
-            value = data[pos:pos + value_length]
-            pos += value_length
-            args = {'data': value, 'language': language, 'stream': stream}
-            if value_type == 2:
-                args['dword'] = False
-            attr = _attribute_types[value_type](**args)
-            asf._tags.setdefault(self.GUID, []).append((name, attr))
-
-    def render(self, asf):
-        attrs = asf.to_metadata_library
-        data = b"".join([attr.render_ml(name) for (name, attr) in attrs])
-        return (self.GUID + struct.pack("<QH", 26 + len(data), len(attrs)) +
-                data)
-
-
-_object_types = {
-    ExtendedContentDescriptionObject.GUID: ExtendedContentDescriptionObject,
-    ContentDescriptionObject.GUID: ContentDescriptionObject,
-    FilePropertiesObject.GUID: FilePropertiesObject,
-    StreamPropertiesObject.GUID: StreamPropertiesObject,
-    HeaderExtensionObject.GUID: HeaderExtensionObject,
-    MetadataLibraryObject.GUID: MetadataLibraryObject,
-    MetadataObject.GUID: MetadataObject,
-}
-
-
-class ASF(FileType):
-    """An ASF file, probably containing WMA or WMV."""
-
-    _mimes = ["audio/x-ms-wma", "audio/x-ms-wmv", "video/x-ms-asf",
-              "audio/x-wma", "video/x-wmv"]
-
-    def load(self, filename):
-        self.filename = filename
-        with open(filename, "rb") as fileobj:
-            self.size = 0
-            self.size1 = 0
-            self.size2 = 0
-            self.offset1 = 0
-            self.offset2 = 0
-            self.num_objects = 0
-            self.info = ASFInfo()
-            self.tags = ASFTags()
-            self.__read_file(fileobj)
-
-    def save(self):
-        # Move attributes to the right objects
-        self.to_content_description = {}
-        self.to_extended_content_description = {}
-        self.to_metadata = {}
-        self.to_metadata_library = []
-        for name, value in self.tags:
-            library_only = (value.data_size() > 0xFFFF or value.TYPE == GUID)
-            can_cont_desc = value.TYPE == UNICODE
-
-            if library_only or value.language is not None:
-                self.to_metadata_library.append((name, value))
-            elif value.stream is not None:
-                if name not in self.to_metadata:
-                    self.to_metadata[name] = value
-                else:
-                    self.to_metadata_library.append((name, value))
-            elif name in ContentDescriptionObject.NAMES:
-                if name not in self.to_content_description and can_cont_desc:
-                    self.to_content_description[name] = value
-                else:
-                    self.to_metadata_library.append((name, value))
-            else:
-                if name not in self.to_extended_content_description:
-                    self.to_extended_content_description[name] = value
-                else:
-                    self.to_metadata_library.append((name, value))
-
-        # Add missing objects
-        if not self.content_description_obj:
-            self.content_description_obj = \
-                ContentDescriptionObject()
-            self.objects.append(self.content_description_obj)
-        if not self.extended_content_description_obj:
-            self.extended_content_description_obj = \
-                ExtendedContentDescriptionObject()
-            self.objects.append(self.extended_content_description_obj)
-        if not self.header_extension_obj:
-            self.header_extension_obj = \
-                HeaderExtensionObject()
-            self.objects.append(self.header_extension_obj)
-        if not self.metadata_obj:
-            self.metadata_obj = \
-                MetadataObject()
-            self.header_extension_obj.objects.append(self.metadata_obj)
-        if not self.metadata_library_obj:
-            self.metadata_library_obj = \
-                MetadataLibraryObject()
-            self.header_extension_obj.objects.append(self.metadata_library_obj)
-
-        # Render the header
-        data = b"".join([obj.render(self) for obj in self.objects])
-        data = (HeaderObject.GUID +
-                struct.pack("<QL", len(data) + 30, len(self.objects)) +
-                b"\x01\x02" + data)
-
-        with open(self.filename, "rb+") as fileobj:
-            size = len(data)
-            if size > self.size:
-                insert_bytes(fileobj, size - self.size, self.size)
-            if size < self.size:
-                delete_bytes(fileobj, self.size - size, 0)
-            fileobj.seek(0)
-            fileobj.write(data)
-
-        self.size = size
-        self.num_objects = len(self.objects)
-
-    def __read_file(self, fileobj):
-        header = fileobj.read(30)
-        if len(header) != 30 or header[:16] != HeaderObject.GUID:
-            raise ASFHeaderError("Not an ASF file.")
-
-        self.extended_content_description_obj = None
-        self.content_description_obj = None
-        self.header_extension_obj = None
-        self.metadata_obj = None
-        self.metadata_library_obj = None
-
-        self.size, self.num_objects = struct.unpack("<QL", header[16:28])
-        self.objects = []
-        self._tags = {}
-        for i in xrange(self.num_objects):
-            self.__read_object(fileobj)
-
-        for guid in [ContentDescriptionObject.GUID,
-                ExtendedContentDescriptionObject.GUID, MetadataObject.GUID,
-                MetadataLibraryObject.GUID]:
-            self.tags.extend(self._tags.pop(guid, []))
-        assert not self._tags
-
-    def __read_object(self, fileobj):
-        guid, size = struct.unpack("<16sQ", fileobj.read(24))
-        if guid in _object_types:
-            obj = _object_types[guid]()
-        else:
-            obj = UnknownObject(guid)
-        data = fileobj.read(size - 24)
-        obj.parse(self, data, fileobj, size)
-        self.objects.append(obj)
-
-    @staticmethod
-    def score(filename, fileobj, header):
-        return header.startswith(HeaderObject.GUID) * 2
-
-Open = ASF
@@ -0,0 +1,338 @@
+# -*- coding: utf-8 -*-
+# Copyright (C) 2005-2006  Joe Wreschnig
+# Copyright (C) 2006-2007  Lukas Lalinsky
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+
+"""Read and write ASF (Window Media Audio) files."""
+
+__all__ = ["ASF", "Open"]
+
+from mutagen import FileType, Tags, StreamInfo
+from mutagen._util import resize_bytes, DictMixin, loadfile, convert_error
+from mutagen._compat import string_types, long_, PY3, izip
+
+from ._util import error, ASFError, ASFHeaderError
+from ._objects import HeaderObject, MetadataLibraryObject, MetadataObject, \
+    ExtendedContentDescriptionObject, HeaderExtensionObject, \
+    ContentDescriptionObject
+from ._attrs import ASFGUIDAttribute, ASFWordAttribute, ASFQWordAttribute, \
+    ASFDWordAttribute, ASFBoolAttribute, ASFByteArrayAttribute, \
+    ASFUnicodeAttribute, ASFBaseAttribute, ASFValue
+
+
+# pyflakes
+error, ASFError, ASFHeaderError, ASFValue
+
+
+class ASFInfo(StreamInfo):
+    """ASFInfo()
+
+    ASF stream information.
+
+    Attributes:
+        length (`float`): "Length in seconds
+        sample_rate (`int`): Sample rate in Hz
+        bitrate (`int`): Bitrate in bps
+        channels (`int`): Number of channels
+        codec_type (`mutagen.text`): Name of the codec type of the first
+            audio stream or an empty string if unknown. Example:
+            ``Windows Media Audio 9 Standard``
+        codec_name (`mutagen.text`): Name and maybe version of the codec used.
+            Example: ``Windows Media Audio 9.1``
+        codec_description (`mutagen.text`): Further information on the codec
+            used. Example: ``64 kbps, 48 kHz, stereo 2-pass CBR``
+    """
+
+    length = 0.0
+    sample_rate = 0
+    bitrate = 0
+    channels = 0
+    codec_type = u""
+    codec_name = u""
+    codec_description = u""
+
+    def __init__(self):
+        self.length = 0.0
+        self.sample_rate = 0
+        self.bitrate = 0
+        self.channels = 0
+        self.codec_type = u""
+        self.codec_name = u""
+        self.codec_description = u""
+
+    def pprint(self):
+        """Returns:
+            text: a stream information text summary
+        """
+
+        s = u"ASF (%s) %d bps, %s Hz, %d channels, %.2f seconds" % (
+            self.codec_type or self.codec_name or u"???", self.bitrate,
+            self.sample_rate, self.channels, self.length)
+        return s
+
+
+class ASFTags(list, DictMixin, Tags):
+    """ASFTags()
+
+    Dictionary containing ASF attributes.
+    """
+
+    def __getitem__(self, key):
+        """A list of values for the key.
+
+        This is a copy, so comment['title'].append('a title') will not
+        work.
+
+        """
+
+        # PY3 only
+        if isinstance(key, slice):
+            return list.__getitem__(self, key)
+
+        values = [value for (k, value) in self if k == key]
+        if not values:
+            raise KeyError(key)
+        else:
+            return values
+
+    def __delitem__(self, key):
+        """Delete all values associated with the key."""
+
+        # PY3 only
+        if isinstance(key, slice):
+            return list.__delitem__(self, key)
+
+        to_delete = [x for x in self if x[0] == key]
+        if not to_delete:
+            raise KeyError(key)
+        else:
+            for k in to_delete:
+                self.remove(k)
+
+    def __contains__(self, key):
+        """Return true if the key has any values."""
+        for k, value in self:
+            if k == key:
+                return True
+        else:
+            return False
+
+    def __setitem__(self, key, values):
+        """Set a key's value or values.
+
+        Setting a value overwrites all old ones. The value may be a
+        list of Unicode or UTF-8 strings, or a single Unicode or UTF-8
+        string.
+        """
+
+        # PY3 only
+        if isinstance(key, slice):
+            return list.__setitem__(self, key, values)
+
+        if not isinstance(values, list):
+            values = [values]
+
+        to_append = []
+        for value in values:
+            if not isinstance(value, ASFBaseAttribute):
+                if isinstance(value, string_types):
+                    value = ASFUnicodeAttribute(value)
+                elif PY3 and isinstance(value, bytes):
+                    value = ASFByteArrayAttribute(value)
+                elif isinstance(value, bool):
+                    value = ASFBoolAttribute(value)
+                elif isinstance(value, int):
+                    value = ASFDWordAttribute(value)
+                elif isinstance(value, long_):
+                    value = ASFQWordAttribute(value)
+                else:
+                    raise TypeError("Invalid type %r" % type(value))
+            to_append.append((key, value))
+
+        try:
+            del(self[key])
+        except KeyError:
+            pass
+
+        self.extend(to_append)
+
+    def keys(self):
+        """Return a sequence of all keys in the comment."""
+
+        return self and set(next(izip(*self)))
+
+    def as_dict(self):
+        """Return a copy of the comment data in a real dict."""
+
+        d = {}
+        for key, value in self:
+            d.setdefault(key, []).append(value)
+        return d
+
+    def pprint(self):
+        """Returns a string containing all key, value pairs.
+
+        :rtype: text
+        """
+
+        return "\n".join("%s=%s" % (k, v) for k, v in self)
+
+
+UNICODE = ASFUnicodeAttribute.TYPE
+"""Unicode string type"""
+
+BYTEARRAY = ASFByteArrayAttribute.TYPE
+"""Byte array type"""
+
+BOOL = ASFBoolAttribute.TYPE
+"""Bool type"""
+
+DWORD = ASFDWordAttribute.TYPE
+""""DWord type (uint32)"""
+
+QWORD = ASFQWordAttribute.TYPE
+"""QWord type (uint64)"""
+
+WORD = ASFWordAttribute.TYPE
+"""Word type (uint16)"""
+
+GUID = ASFGUIDAttribute.TYPE
+"""GUID type"""
+
+
+class ASF(FileType):
+    """ASF(filething)
+
+    An ASF file, probably containing WMA or WMV.
+
+    Arguments:
+        filething (filething)
+
+    Attributes:
+        info (`ASFInfo`)
+        tags (`ASFTags`)
+    """
+
+    _mimes = ["audio/x-ms-wma", "audio/x-ms-wmv", "video/x-ms-asf",
+              "audio/x-wma", "video/x-wmv"]
+
+    info = None
+    tags = None
+
+    @convert_error(IOError, error)
+    @loadfile()
+    def load(self, filething):
+        """load(filething)
+
+        Args:
+            filething (filething)
+        Raises:
+            mutagen.MutagenError
+        """
+
+        fileobj = filething.fileobj
+
+        self.info = ASFInfo()
+        self.tags = ASFTags()
+
+        self._tags = {}
+        self._header = HeaderObject.parse_full(self, fileobj)
+
+        for guid in [ContentDescriptionObject.GUID,
+                     ExtendedContentDescriptionObject.GUID,
+                     MetadataObject.GUID,
+                     MetadataLibraryObject.GUID]:
+            self.tags.extend(self._tags.pop(guid, []))
+
+        assert not self._tags
+
+    @convert_error(IOError, error)
+    @loadfile(writable=True)
+    def save(self, filething, padding=None):
+        """save(filething=None, padding=None)
+
+        Save tag changes back to the loaded file.
+
+        Args:
+            filething (filething)
+            padding (PaddingFunction)
+        Raises:
+            mutagen.MutagenError
+        """
+
+        # Move attributes to the right objects
+        self.to_content_description = {}
+        self.to_extended_content_description = {}
+        self.to_metadata = {}
+        self.to_metadata_library = []
+        for name, value in self.tags:
+            library_only = (value.data_size() > 0xFFFF or value.TYPE == GUID)
+            can_cont_desc = value.TYPE == UNICODE
+
+            if library_only or value.language is not None:
+                self.to_metadata_library.append((name, value))
+            elif value.stream is not None:
+                if name not in self.to_metadata:
+                    self.to_metadata[name] = value
+                else:
+                    self.to_metadata_library.append((name, value))
+            elif name in ContentDescriptionObject.NAMES:
+                if name not in self.to_content_description and can_cont_desc:
+                    self.to_content_description[name] = value
+                else:
+                    self.to_metadata_library.append((name, value))
+            else:
+                if name not in self.to_extended_content_description:
+                    self.to_extended_content_description[name] = value
+                else:
+                    self.to_metadata_library.append((name, value))
+
+        # Add missing objects
+        header = self._header
+        if header.get_child(ContentDescriptionObject.GUID) is None:
+            header.objects.append(ContentDescriptionObject())
+        if header.get_child(ExtendedContentDescriptionObject.GUID) is None:
+            header.objects.append(ExtendedContentDescriptionObject())
+        header_ext = header.get_child(HeaderExtensionObject.GUID)
+        if header_ext is None:
+            header_ext = HeaderExtensionObject()
+            header.objects.append(header_ext)
+        if header_ext.get_child(MetadataObject.GUID) is None:
+            header_ext.objects.append(MetadataObject())
+        if header_ext.get_child(MetadataLibraryObject.GUID) is None:
+            header_ext.objects.append(MetadataLibraryObject())
+
+        fileobj = filething.fileobj
+        # Render to file
+        old_size = header.parse_size(fileobj)[0]
+        data = header.render_full(self, fileobj, old_size, padding)
+        size = len(data)
+        resize_bytes(fileobj, old_size, size, 0)
+        fileobj.seek(0)
+        fileobj.write(data)
+
+    def add_tags(self):
+        raise ASFError
+
+    @loadfile(writable=True)
+    def delete(self, filething):
+        """delete(filething=None)
+
+        Args:
+            filething (filething)
+        Raises:
+            mutagen.MutagenError
+        """
+
+        self.tags.clear()
+        self.save(filething, padding=lambda x: 0)
+
+    @staticmethod
+    def score(filename, fileobj, header):
+        return header.startswith(HeaderObject.GUID) * 2
+
+Open = ASF
@@ -0,0 +1,439 @@
+# -*- coding: utf-8 -*-
+# Copyright (C) 2005-2006  Joe Wreschnig
+# Copyright (C) 2006-2007  Lukas Lalinsky
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+
+import sys
+import struct
+
+from mutagen._compat import swap_to_string, text_type, PY2, reraise
+from mutagen._util import total_ordering
+
+from ._util import ASFError
+
+
+class ASFBaseAttribute(object):
+    """Generic attribute."""
+
+    TYPE = None
+
+    _TYPES = {}
+
+    value = None
+    """The Python value of this attribute (type depends on the class)"""
+
+    language = None
+    """Language"""
+
+    stream = None
+    """Stream"""
+
+    def __init__(self, value=None, data=None, language=None,
+                 stream=None, **kwargs):
+        self.language = language
+        self.stream = stream
+        if data:
+            self.value = self.parse(data, **kwargs)
+        else:
+            if value is None:
+                # we used to support not passing any args and instead assign
+                # them later, keep that working..
+                self.value = None
+            else:
+                self.value = self._validate(value)
+
+    @classmethod
+    def _register(cls, other):
+        cls._TYPES[other.TYPE] = other
+        return other
+
+    @classmethod
+    def _get_type(cls, type_):
+        """Raises KeyError"""
+
+        return cls._TYPES[type_]
+
+    def _validate(self, value):
+        """Raises TypeError or ValueError in case the user supplied value
+        isn't valid.
+        """
+
+        return value
+
+    def data_size(self):
+        raise NotImplementedError
+
+    def __repr__(self):
+        name = "%s(%r" % (type(self).__name__, self.value)
+        if self.language:
+            name += ", language=%d" % self.language
+        if self.stream:
+            name += ", stream=%d" % self.stream
+        name += ")"
+        return name
+
+    def render(self, name):
+        name = name.encode("utf-16-le") + b"\x00\x00"
+        data = self._render()
+        return (struct.pack("<H", len(name)) + name +
+                struct.pack("<HH", self.TYPE, len(data)) + data)
+
+    def render_m(self, name):
+        name = name.encode("utf-16-le") + b"\x00\x00"
+        if self.TYPE == 2:
+            data = self._render(dword=False)
+        else:
+            data = self._render()
+        return (struct.pack("<HHHHI", 0, self.stream or 0, len(name),
+                            self.TYPE, len(data)) + name + data)
+
+    def render_ml(self, name):
+        name = name.encode("utf-16-le") + b"\x00\x00"
+        if self.TYPE == 2:
+            data = self._render(dword=False)
+        else:
+            data = self._render()
+
+        return (struct.pack("<HHHHI", self.language or 0, self.stream or 0,
+                            len(name), self.TYPE, len(data)) + name + data)
+
+
+@ASFBaseAttribute._register
+@swap_to_string
+@total_ordering
+class ASFUnicodeAttribute(ASFBaseAttribute):
+    """Unicode string attribute.
+
+    ::
+
+        ASFUnicodeAttribute(u'some text')
+    """
+
+    TYPE = 0x0000
+
+    def parse(self, data):
+        try:
+            return data.decode("utf-16-le").strip("\x00")
+        except UnicodeDecodeError as e:
+            reraise(ASFError, e, sys.exc_info()[2])
+
+    def _validate(self, value):
+        if not isinstance(value, text_type):
+            if PY2:
+                return value.decode("utf-8")
+            else:
+                raise TypeError("%r not str" % value)
+        return value
+
+    def _render(self):
+        return self.value.encode("utf-16-le") + b"\x00\x00"
+
+    def data_size(self):
+        return len(self._render())
+
+    def __bytes__(self):
+        return self.value.encode("utf-16-le")
+
+    def __str__(self):
+        return self.value
+
+    def __eq__(self, other):
+        return text_type(self) == other
+
+    def __lt__(self, other):
+        return text_type(self) < other
+
+    __hash__ = ASFBaseAttribute.__hash__
+
+
+@ASFBaseAttribute._register
+@swap_to_string
+@total_ordering
+class ASFByteArrayAttribute(ASFBaseAttribute):
+    """Byte array attribute.
+
+    ::
+
+        ASFByteArrayAttribute(b'1234')
+    """
+    TYPE = 0x0001
+
+    def parse(self, data):
+        assert isinstance(data, bytes)
+        return data
+
+    def _render(self):
+        assert isinstance(self.value, bytes)
+        return self.value
+
+    def _validate(self, value):
+        if not isinstance(value, bytes):
+            raise TypeError("must be bytes/str: %r" % value)
+        return value
+
+    def data_size(self):
+        return len(self.value)
+
+    def __bytes__(self):
+        return self.value
+
+    def __str__(self):
+        return "[binary data (%d bytes)]" % len(self.value)
+
+    def __eq__(self, other):
+        return self.value == other
+
+    def __lt__(self, other):
+        return self.value < other
+
+    __hash__ = ASFBaseAttribute.__hash__
+
+
+@ASFBaseAttribute._register
+@swap_to_string
+@total_ordering
+class ASFBoolAttribute(ASFBaseAttribute):
+    """Bool attribute.
+
+    ::
+
+        ASFBoolAttribute(True)
+    """
+
+    TYPE = 0x0002
+
+    def parse(self, data, dword=True):
+        if dword:
+            return struct.unpack("<I", data)[0] == 1
+        else:
+            return struct.unpack("<H", data)[0] == 1
+
+    def _render(self, dword=True):
+        if dword:
+            return struct.pack("<I", bool(self.value))
+        else:
+            return struct.pack("<H", bool(self.value))
+
+    def _validate(self, value):
+        return bool(value)
+
+    def data_size(self):
+        return 4
+
+    def __bool__(self):
+        return bool(self.value)
+
+    def __bytes__(self):
+        return text_type(self.value).encode('utf-8')
+
+    def __str__(self):
+        return text_type(self.value)
+
+    def __eq__(self, other):
+        return bool(self.value) == other
+
+    def __lt__(self, other):
+        return bool(self.value) < other
+
+    __hash__ = ASFBaseAttribute.__hash__
+
+
+@ASFBaseAttribute._register
+@swap_to_string
+@total_ordering
+class ASFDWordAttribute(ASFBaseAttribute):
+    """DWORD attribute.
+
+    ::
+
+        ASFDWordAttribute(42)
+    """
+
+    TYPE = 0x0003
+
+    def parse(self, data):
+        return struct.unpack("<L", data)[0]
+
+    def _render(self):
+        return struct.pack("<L", self.value)
+
+    def _validate(self, value):
+        value = int(value)
+        if not 0 <= value <= 2 ** 32 - 1:
+            raise ValueError("Out of range")
+        return value
+
+    def data_size(self):
+        return 4
+
+    def __int__(self):
+        return self.value
+
+    def __bytes__(self):
+        return text_type(self.value).encode('utf-8')
+
+    def __str__(self):
+        return text_type(self.value)
+
+    def __eq__(self, other):
+        return int(self.value) == other
+
+    def __lt__(self, other):
+        return int(self.value) < other
+
+    __hash__ = ASFBaseAttribute.__hash__
+
+
+@ASFBaseAttribute._register
+@swap_to_string
+@total_ordering
+class ASFQWordAttribute(ASFBaseAttribute):
+    """QWORD attribute.
+
+    ::
+
+        ASFQWordAttribute(42)
+    """
+
+    TYPE = 0x0004
+
+    def parse(self, data):
+        return struct.unpack("<Q", data)[0]
+
+    def _render(self):
+        return struct.pack("<Q", self.value)
+
+    def _validate(self, value):
+        value = int(value)
+        if not 0 <= value <= 2 ** 64 - 1:
+            raise ValueError("Out of range")
+        return value
+
+    def data_size(self):
+        return 8
+
+    def __int__(self):
+        return self.value
+
+    def __bytes__(self):
+        return text_type(self.value).encode('utf-8')
+
+    def __str__(self):
+        return text_type(self.value)
+
+    def __eq__(self, other):
+        return int(self.value) == other
+
+    def __lt__(self, other):
+        return int(self.value) < other
+
+    __hash__ = ASFBaseAttribute.__hash__
+
+
+@ASFBaseAttribute._register
+@swap_to_string
+@total_ordering
+class ASFWordAttribute(ASFBaseAttribute):
+    """WORD attribute.
+
+    ::
+
+        ASFWordAttribute(42)
+    """
+
+    TYPE = 0x0005
+
+    def parse(self, data):
+        return struct.unpack("<H", data)[0]
+
+    def _render(self):
+        return struct.pack("<H", self.value)
+
+    def _validate(self, value):
+        value = int(value)
+        if not 0 <= value <= 2 ** 16 - 1:
+            raise ValueError("Out of range")
+        return value
+
+    def data_size(self):
+        return 2
+
+    def __int__(self):
+        return self.value
+
+    def __bytes__(self):
+        return text_type(self.value).encode('utf-8')
+
+    def __str__(self):
+        return text_type(self.value)
+
+    def __eq__(self, other):
+        return int(self.value) == other
+
+    def __lt__(self, other):
+        return int(self.value) < other
+
+    __hash__ = ASFBaseAttribute.__hash__
+
+
+@ASFBaseAttribute._register
+@swap_to_string
+@total_ordering
+class ASFGUIDAttribute(ASFBaseAttribute):
+    """GUID attribute."""
+
+    TYPE = 0x0006
+
+    def parse(self, data):
+        assert isinstance(data, bytes)
+        return data
+
+    def _render(self):
+        assert isinstance(self.value, bytes)
+        return self.value
+
+    def _validate(self, value):
+        if not isinstance(value, bytes):
+            raise TypeError("must be bytes/str: %r" % value)
+        return value
+
+    def data_size(self):
+        return len(self.value)
+
+    def __bytes__(self):
+        return self.value
+
+    def __str__(self):
+        return repr(self.value)
+
+    def __eq__(self, other):
+        return self.value == other
+
+    def __lt__(self, other):
+        return self.value < other
+
+    __hash__ = ASFBaseAttribute.__hash__
+
+
+def ASFValue(value, kind, **kwargs):
+    """Create a tag value of a specific kind.
+
+    ::
+
+        ASFValue(u"My Value", UNICODE)
+
+    :rtype: ASFBaseAttribute
+    :raises TypeError: in case a wrong type was passed
+    :raises ValueError: in case the value can't be be represented as ASFValue.
+    """
+
+    try:
+        attr_type = ASFBaseAttribute._get_type(kind)
+    except KeyError:
+        raise ValueError("Unknown value type %r" % kind)
+    else:
+        return attr_type(value=value, **kwargs)
@@ -0,0 +1,461 @@
+# -*- coding: utf-8 -*-
+# Copyright (C) 2005-2006  Joe Wreschnig
+# Copyright (C) 2006-2007  Lukas Lalinsky
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+
+import struct
+
+from mutagen._util import cdata, get_size
+from mutagen._compat import text_type, xrange, izip
+from mutagen._tags import PaddingInfo
+
+from ._util import guid2bytes, bytes2guid, CODECS, ASFError, ASFHeaderError
+from ._attrs import ASFBaseAttribute, ASFUnicodeAttribute
+
+
+class BaseObject(object):
+    """Base ASF object."""
+
+    GUID = None
+    _TYPES = {}
+
+    def __init__(self):
+        self.objects = []
+        self.data = b""
+
+    def parse(self, asf, data):
+        self.data = data
+
+    def render(self, asf):
+        data = self.GUID + struct.pack("<Q", len(self.data) + 24) + self.data
+        return data
+
+    def get_child(self, guid):
+        for obj in self.objects:
+            if obj.GUID == guid:
+                return obj
+        return None
+
+    @classmethod
+    def _register(cls, other):
+        cls._TYPES[other.GUID] = other
+        return other
+
+    @classmethod
+    def _get_object(cls, guid):
+        if guid in cls._TYPES:
+            return cls._TYPES[guid]()
+        else:
+            return UnknownObject(guid)
+
+    def __repr__(self):
+        return "<%s GUID=%s objects=%r>" % (
+            type(self).__name__, bytes2guid(self.GUID), self.objects)
+
+    def pprint(self):
+        l = []
+        l.append("%s(%s)" % (type(self).__name__, bytes2guid(self.GUID)))
+        for o in self.objects:
+            for e in o.pprint().splitlines():
+                l.append("  " + e)
+        return "\n".join(l)
+
+
+class UnknownObject(BaseObject):
+    """Unknown ASF object."""
+
+    def __init__(self, guid):
+        super(UnknownObject, self).__init__()
+        assert isinstance(guid, bytes)
+        self.GUID = guid
+
+
+@BaseObject._register
+class HeaderObject(BaseObject):
+    """ASF header."""
+
+    GUID = guid2bytes("75B22630-668E-11CF-A6D9-00AA0062CE6C")
+
+    @classmethod
+    def parse_full(cls, asf, fileobj):
+        """Raises ASFHeaderError"""
+
+        header = cls()
+
+        remaining_header, num_objects = cls.parse_size(fileobj)
+        remaining_header -= 30
+
+        for i in xrange(num_objects):
+            obj_header_size = 24
+            if remaining_header < obj_header_size:
+                raise ASFHeaderError("invalid header size")
+            data = fileobj.read(obj_header_size)
+            if len(data) != obj_header_size:
+                raise ASFHeaderError("truncated")
+            remaining_header -= obj_header_size
+
+            guid, size = struct.unpack("<16sQ", data)
+            obj = BaseObject._get_object(guid)
+
+            payload_size = size - obj_header_size
+            if remaining_header < payload_size:
+                raise ASFHeaderError("invalid object size")
+            remaining_header -= payload_size
+
+            try:
+                data = fileobj.read(payload_size)
+            except OverflowError:
+                # read doesn't take 64bit values
+                raise ASFHeaderError("invalid header size")
+            if len(data) != payload_size:
+                raise ASFHeaderError("truncated")
+
+            obj.parse(asf, data)
+            header.objects.append(obj)
+
+        return header
+
+    @classmethod
+    def parse_size(cls, fileobj):
+        """Returns (size, num_objects)
+
+        Raises ASFHeaderError
+        """
+
+        header = fileobj.read(30)
+        if len(header) != 30 or header[:16] != HeaderObject.GUID:
+            raise ASFHeaderError("Not an ASF file.")
+
+        return struct.unpack("<QL", header[16:28])
+
+    def render_full(self, asf, fileobj, available, padding_func):
+        # Render everything except padding
+        num_objects = 0
+        data = bytearray()
+        for obj in self.objects:
+            if obj.GUID == PaddingObject.GUID:
+                continue
+            data += obj.render(asf)
+            num_objects += 1
+
+        # calculate how much space we need at least
+        padding_obj = PaddingObject()
+        header_size = len(HeaderObject.GUID) + 14
+        padding_overhead = len(padding_obj.render(asf))
+        needed_size = len(data) + header_size + padding_overhead
+
+        # ask the user for padding adjustments
+        file_size = get_size(fileobj)
+        content_size = file_size - available
+        assert content_size >= 0
+        info = PaddingInfo(available - needed_size, content_size)
+
+        # add padding
+        padding = info._get_padding(padding_func)
+        padding_obj.parse(asf, b"\x00" * padding)
+        data += padding_obj.render(asf)
+        num_objects += 1
+
+        data = (HeaderObject.GUID +
+                struct.pack("<QL", len(data) + 30, num_objects) +
+                b"\x01\x02" + data)
+
+        return data
+
+    def parse(self, asf, data):
+        raise NotImplementedError
+
+    def render(self, asf):
+        raise NotImplementedError
+
+
+@BaseObject._register
+class ContentDescriptionObject(BaseObject):
+    """Content description."""
+
+    GUID = guid2bytes("75B22633-668E-11CF-A6D9-00AA0062CE6C")
+
+    NAMES = [
+        u"Title",
+        u"Author",
+        u"Copyright",
+        u"Description",
+        u"Rating",
+    ]
+
+    def parse(self, asf, data):
+        super(ContentDescriptionObject, self).parse(asf, data)
+        lengths = struct.unpack("<HHHHH", data[:10])
+        texts = []
+        pos = 10
+        for length in lengths:
+            end = pos + length
+            if length > 0:
+                texts.append(data[pos:end].decode("utf-16-le").strip(u"\x00"))
+            else:
+                texts.append(None)
+            pos = end
+
+        for key, value in izip(self.NAMES, texts):
+            if value is not None:
+                value = ASFUnicodeAttribute(value=value)
+                asf._tags.setdefault(self.GUID, []).append((key, value))
+
+    def render(self, asf):
+        def render_text(name):
+            value = asf.to_content_description.get(name)
+            if value is not None:
+                return text_type(value).encode("utf-16-le") + b"\x00\x00"
+            else:
+                return b""
+
+        texts = [render_text(x) for x in self.NAMES]
+        data = struct.pack("<HHHHH", *map(len, texts)) + b"".join(texts)
+        return self.GUID + struct.pack("<Q", 24 + len(data)) + data
+
+
+@BaseObject._register
+class ExtendedContentDescriptionObject(BaseObject):
+    """Extended content description."""
+
+    GUID = guid2bytes("D2D0A440-E307-11D2-97F0-00A0C95EA850")
+
+    def parse(self, asf, data):
+        super(ExtendedContentDescriptionObject, self).parse(asf, data)
+        num_attributes, = struct.unpack("<H", data[0:2])
+        pos = 2
+        for i in xrange(num_attributes):
+            name_length, = struct.unpack("<H", data[pos:pos + 2])
+            pos += 2
+            name = data[pos:pos + name_length]
+            name = name.decode("utf-16-le").strip("\x00")
+            pos += name_length
+            value_type, value_length = struct.unpack("<HH", data[pos:pos + 4])
+            pos += 4
+            value = data[pos:pos + value_length]
+            pos += value_length
+            attr = ASFBaseAttribute._get_type(value_type)(data=value)
+            asf._tags.setdefault(self.GUID, []).append((name, attr))
+
+    def render(self, asf):
+        attrs = asf.to_extended_content_description.items()
+        data = b"".join(attr.render(name) for (name, attr) in attrs)
+        data = struct.pack("<QH", 26 + len(data), len(attrs)) + data
+        return self.GUID + data
+
+
+@BaseObject._register
+class FilePropertiesObject(BaseObject):
+    """File properties."""
+
+    GUID = guid2bytes("8CABDCA1-A947-11CF-8EE4-00C00C205365")
+
+    def parse(self, asf, data):
+        super(FilePropertiesObject, self).parse(asf, data)
+        length, _, preroll = struct.unpack("<QQQ", data[40:64])
+        # there are files where preroll is larger than length, limit to >= 0
+        asf.info.length = max((length / 10000000.0) - (preroll / 1000.0), 0.0)
+
+
+@BaseObject._register
+class StreamPropertiesObject(BaseObject):
+    """Stream properties."""
+
+    GUID = guid2bytes("B7DC0791-A9B7-11CF-8EE6-00C00C205365")
+
+    def parse(self, asf, data):
+        super(StreamPropertiesObject, self).parse(asf, data)
+        channels, sample_rate, bitrate = struct.unpack("<HII", data[56:66])
+        asf.info.channels = channels
+        asf.info.sample_rate = sample_rate
+        asf.info.bitrate = bitrate * 8
+
+
+@BaseObject._register
+class CodecListObject(BaseObject):
+    """Codec List"""
+
+    GUID = guid2bytes("86D15240-311D-11D0-A3A4-00A0C90348F6")
+
+    def _parse_entry(self, data, offset):
+        """can raise cdata.error"""
+
+        type_, offset = cdata.uint16_le_from(data, offset)
+
+        units, offset = cdata.uint16_le_from(data, offset)
+        # utf-16 code units, not characters..
+        next_offset = offset + units * 2
+        try:
+            name = data[offset:next_offset].decode("utf-16-le").strip("\x00")
+        except UnicodeDecodeError:
+            name = u""
+        offset = next_offset
+
+        units, offset = cdata.uint16_le_from(data, offset)
+        next_offset = offset + units * 2
+        try:
+            desc = data[offset:next_offset].decode("utf-16-le").strip("\x00")
+        except UnicodeDecodeError:
+            desc = u""
+        offset = next_offset
+
+        bytes_, offset = cdata.uint16_le_from(data, offset)
+        next_offset = offset + bytes_
+        codec = u""
+        if bytes_ == 2:
+            codec_id = cdata.uint16_le_from(data, offset)[0]
+            if codec_id in CODECS:
+                codec = CODECS[codec_id]
+        offset = next_offset
+
+        return offset, type_, name, desc, codec
+
+    def parse(self, asf, data):
+        super(CodecListObject, self).parse(asf, data)
+
+        offset = 16
+        count, offset = cdata.uint32_le_from(data, offset)
+        for i in xrange(count):
+            try:
+                offset, type_, name, desc, codec = \
+                    self._parse_entry(data, offset)
+            except cdata.error:
+                raise ASFError("invalid codec entry")
+
+            # go with the first audio entry
+            if type_ == 2:
+                name = name.strip()
+                desc = desc.strip()
+                asf.info.codec_type = codec
+                asf.info.codec_name = name
+                asf.info.codec_description = desc
+                return
+
+
+@BaseObject._register
+class PaddingObject(BaseObject):
+    """Padding object"""
+
+    GUID = guid2bytes("1806D474-CADF-4509-A4BA-9AABCB96AAE8")
+
+
+@BaseObject._register
+class StreamBitratePropertiesObject(BaseObject):
+    """Stream bitrate properties"""
+
+    GUID = guid2bytes("7BF875CE-468D-11D1-8D82-006097C9A2B2")
+
+
+@BaseObject._register
+class ContentEncryptionObject(BaseObject):
+    """Content encryption"""
+
+    GUID = guid2bytes("2211B3FB-BD23-11D2-B4B7-00A0C955FC6E")
+
+
+@BaseObject._register
+class ExtendedContentEncryptionObject(BaseObject):
+    """Extended content encryption"""
+
+    GUID = guid2bytes("298AE614-2622-4C17-B935-DAE07EE9289C")
+
+
+@BaseObject._register
+class HeaderExtensionObject(BaseObject):
+    """Header extension."""
+
+    GUID = guid2bytes("5FBF03B5-A92E-11CF-8EE3-00C00C205365")
+
+    def parse(self, asf, data):
+        super(HeaderExtensionObject, self).parse(asf, data)
+        datasize, = struct.unpack("<I", data[18:22])
+        datapos = 0
+        while datapos < datasize:
+            guid, size = struct.unpack(
+                "<16sQ", data[22 + datapos:22 + datapos + 24])
+            obj = BaseObject._get_object(guid)
+            obj.parse(asf, data[22 + datapos + 24:22 + datapos + size])
+            self.objects.append(obj)
+            datapos += size
+
+    def render(self, asf):
+        data = bytearray()
+        for obj in self.objects:
+            # some files have the padding in the extension header, but we
+            # want to add it at the end of the top level header. Just
+            # skip padding at this level.
+            if obj.GUID == PaddingObject.GUID:
+                continue
+            data += obj.render(asf)
+        return (self.GUID + struct.pack("<Q", 24 + 16 + 6 + len(data)) +
+                b"\x11\xD2\xD3\xAB\xBA\xA9\xcf\x11" +
+                b"\x8E\xE6\x00\xC0\x0C\x20\x53\x65" +
+                b"\x06\x00" + struct.pack("<I", len(data)) + data)
+
+
+@BaseObject._register
+class MetadataObject(BaseObject):
+    """Metadata description."""
+
+    GUID = guid2bytes("C5F8CBEA-5BAF-4877-8467-AA8C44FA4CCA")
+
+    def parse(self, asf, data):
+        super(MetadataObject, self).parse(asf, data)
+        num_attributes, = struct.unpack("<H", data[0:2])
+        pos = 2
+        for i in xrange(num_attributes):
+            (reserved, stream, name_length, value_type,
+             value_length) = struct.unpack("<HHHHI", data[pos:pos + 12])
+            pos += 12
+            name = data[pos:pos + name_length]
+            name = name.decode("utf-16-le").strip("\x00")
+            pos += name_length
+            value = data[pos:pos + value_length]
+            pos += value_length
+            args = {'data': value, 'stream': stream}
+            if value_type == 2:
+                args['dword'] = False
+            attr = ASFBaseAttribute._get_type(value_type)(**args)
+            asf._tags.setdefault(self.GUID, []).append((name, attr))
+
+    def render(self, asf):
+        attrs = asf.to_metadata.items()
+        data = b"".join([attr.render_m(name) for (name, attr) in attrs])
+        return (self.GUID + struct.pack("<QH", 26 + len(data), len(attrs)) +
+                data)
+
+
+@BaseObject._register
+class MetadataLibraryObject(BaseObject):
+    """Metadata library description."""
+
+    GUID = guid2bytes("44231C94-9498-49D1-A141-1D134E457054")
+
+    def parse(self, asf, data):
+        super(MetadataLibraryObject, self).parse(asf, data)
+        num_attributes, = struct.unpack("<H", data[0:2])
+        pos = 2
+        for i in xrange(num_attributes):
+            (language, stream, name_length, value_type,
+             value_length) = struct.unpack("<HHHHI", data[pos:pos + 12])
+            pos += 12
+            name = data[pos:pos + name_length]
+            name = name.decode("utf-16-le").strip("\x00")
+            pos += name_length
+            value = data[pos:pos + value_length]
+            pos += value_length
+            args = {'data': value, 'language': language, 'stream': stream}
+            if value_type == 2:
+                args['dword'] = False
+            attr = ASFBaseAttribute._get_type(value_type)(**args)
+            asf._tags.setdefault(self.GUID, []).append((name, attr))
+
+    def render(self, asf):
+        attrs = asf.to_metadata_library
+        data = b"".join([attr.render_ml(name) for (name, attr) in attrs])
+        return (self.GUID + struct.pack("<QH", 26 + len(data), len(attrs)) +
+                data)
@@ -0,0 +1,316 @@
+# -*- coding: utf-8 -*-
+# Copyright (C) 2005-2006  Joe Wreschnig
+# Copyright (C) 2006-2007  Lukas Lalinsky
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+
+import struct
+
+from mutagen._util import MutagenError
+
+
+class error(MutagenError):
+    """Error raised by :mod:`mutagen.asf`"""
+
+
+class ASFError(error):
+    pass
+
+
+class ASFHeaderError(error):
+    pass
+
+
+def guid2bytes(s):
+    """Converts a GUID to the serialized bytes representation"""
+
+    assert isinstance(s, str)
+    assert len(s) == 36
+
+    p = struct.pack
+    return b"".join([
+        p("<IHH", int(s[:8], 16), int(s[9:13], 16), int(s[14:18], 16)),
+        p(">H", int(s[19:23], 16)),
+        p(">Q", int(s[24:], 16))[2:],
+    ])
+
+
+def bytes2guid(s):
+    """Converts a serialized GUID to a text GUID"""
+
+    assert isinstance(s, bytes)
+
+    u = struct.unpack
+    v = []
+    v.extend(u("<IHH", s[:8]))
+    v.extend(u(">HQ", s[8:10] + b"\x00\x00" + s[10:]))
+    return "%08X-%04X-%04X-%04X-%012X" % tuple(v)
+
+
+# Names from http://windows.microsoft.com/en-za/windows7/c00d10d1-[0-9A-F]{1,4}
+CODECS = {
+    0x0000: u"Unknown Wave Format",
+    0x0001: u"Microsoft PCM Format",
+    0x0002: u"Microsoft ADPCM Format",
+    0x0003: u"IEEE Float",
+    0x0004: u"Compaq Computer VSELP",
+    0x0005: u"IBM CVSD",
+    0x0006: u"Microsoft CCITT A-Law",
+    0x0007: u"Microsoft CCITT u-Law",
+    0x0008: u"Microsoft DTS",
+    0x0009: u"Microsoft DRM",
+    0x000A: u"Windows Media Audio 9 Voice",
+    0x000B: u"Windows Media Audio 10 Voice",
+    0x000C: u"OGG Vorbis",
+    0x000D: u"FLAC",
+    0x000E: u"MOT AMR",
+    0x000F: u"Nice Systems IMBE",
+    0x0010: u"OKI ADPCM",
+    0x0011: u"Intel IMA ADPCM",
+    0x0012: u"Videologic MediaSpace ADPCM",
+    0x0013: u"Sierra Semiconductor ADPCM",
+    0x0014: u"Antex Electronics G.723 ADPCM",
+    0x0015: u"DSP Solutions DIGISTD",
+    0x0016: u"DSP Solutions DIGIFIX",
+    0x0017: u"Dialogic OKI ADPCM",
+    0x0018: u"MediaVision ADPCM",
+    0x0019: u"Hewlett-Packard CU codec",
+    0x001A: u"Hewlett-Packard Dynamic Voice",
+    0x0020: u"Yamaha ADPCM",
+    0x0021: u"Speech Compression SONARC",
+    0x0022: u"DSP Group True Speech",
+    0x0023: u"Echo Speech EchoSC1",
+    0x0024: u"Ahead Inc. Audiofile AF36",
+    0x0025: u"Audio Processing Technology APTX",
+    0x0026: u"Ahead Inc. AudioFile AF10",
+    0x0027: u"Aculab Prosody 1612",
+    0x0028: u"Merging Technologies S.A. LRC",
+    0x0030: u"Dolby Labs AC2",
+    0x0031: u"Microsoft GSM 6.10",
+    0x0032: u"Microsoft MSNAudio",
+    0x0033: u"Antex Electronics ADPCME",
+    0x0034: u"Control Resources VQLPC",
+    0x0035: u"DSP Solutions Digireal",
+    0x0036: u"DSP Solutions DigiADPCM",
+    0x0037: u"Control Resources CR10",
+    0x0038: u"Natural MicroSystems VBXADPCM",
+    0x0039: u"Crystal Semiconductor IMA ADPCM",
+    0x003A: u"Echo Speech EchoSC3",
+    0x003B: u"Rockwell ADPCM",
+    0x003C: u"Rockwell DigiTalk",
+    0x003D: u"Xebec Multimedia Solutions",
+    0x0040: u"Antex Electronics G.721 ADPCM",
+    0x0041: u"Antex Electronics G.728 CELP",
+    0x0042: u"Intel G.723",
+    0x0043: u"Intel G.723.1",
+    0x0044: u"Intel G.729 Audio",
+    0x0045: u"Sharp G.726 Audio",
+    0x0050: u"Microsoft MPEG-1",
+    0x0052: u"InSoft RT24",
+    0x0053: u"InSoft PAC",
+    0x0055: u"MP3 - MPEG Layer III",
+    0x0059: u"Lucent G.723",
+    0x0060: u"Cirrus Logic",
+    0x0061: u"ESS Technology ESPCM",
+    0x0062: u"Voxware File-Mode",
+    0x0063: u"Canopus Atrac",
+    0x0064: u"APICOM G.726 ADPCM",
+    0x0065: u"APICOM G.722 ADPCM",
+    0x0066: u"Microsoft DSAT",
+    0x0067: u"Microsoft DSAT Display",
+    0x0069: u"Voxware Byte Aligned",
+    0x0070: u"Voxware AC8",
+    0x0071: u"Voxware AC10",
+    0x0072: u"Voxware AC16",
+    0x0073: u"Voxware AC20",
+    0x0074: u"Voxware RT24 MetaVoice",
+    0x0075: u"Voxware RT29 MetaSound",
+    0x0076: u"Voxware RT29HW",
+    0x0077: u"Voxware VR12",
+    0x0078: u"Voxware VR18",
+    0x0079: u"Voxware TQ40",
+    0x007A: u"Voxware SC3",
+    0x007B: u"Voxware SC3",
+    0x0080: u"Softsound",
+    0x0081: u"Voxware TQ60",
+    0x0082: u"Microsoft MSRT24",
+    0x0083: u"AT&T Labs G.729A",
+    0x0084: u"Motion Pixels MVI MV12",
+    0x0085: u"DataFusion Systems G.726",
+    0x0086: u"DataFusion Systems GSM610",
+    0x0088: u"Iterated Systems ISIAudio",
+    0x0089: u"Onlive",
+    0x008A: u"Multitude FT SX20",
+    0x008B: u"Infocom ITS ACM G.721",
+    0x008C: u"Convedia G.729",
+    0x008D: u"Congruency Audio",
+    0x0091: u"Siemens Business Communications SBC24",
+    0x0092: u"Sonic Foundry Dolby AC3 SPDIF",
+    0x0093: u"MediaSonic G.723",
+    0x0094: u"Aculab Prosody 8KBPS",
+    0x0097: u"ZyXEL ADPCM",
+    0x0098: u"Philips LPCBB",
+    0x0099: u"Studer Professional Audio AG Packed",
+    0x00A0: u"Malden Electronics PHONYTALK",
+    0x00A1: u"Racal Recorder GSM",
+    0x00A2: u"Racal Recorder G720.a",
+    0x00A3: u"Racal Recorder G723.1",
+    0x00A4: u"Racal Recorder Tetra ACELP",
+    0x00B0: u"NEC AAC",
+    0x00FF: u"CoreAAC Audio",
+    0x0100: u"Rhetorex ADPCM",
+    0x0101: u"BeCubed Software IRAT",
+    0x0111: u"Vivo G.723",
+    0x0112: u"Vivo Siren",
+    0x0120: u"Philips CELP",
+    0x0121: u"Philips Grundig",
+    0x0123: u"Digital G.723",
+    0x0125: u"Sanyo ADPCM",
+    0x0130: u"Sipro Lab Telecom ACELP.net",
+    0x0131: u"Sipro Lab Telecom ACELP.4800",
+    0x0132: u"Sipro Lab Telecom ACELP.8V3",
+    0x0133: u"Sipro Lab Telecom ACELP.G.729",
+    0x0134: u"Sipro Lab Telecom ACELP.G.729A",
+    0x0135: u"Sipro Lab Telecom ACELP.KELVIN",
+    0x0136: u"VoiceAge AMR",
+    0x0140: u"Dictaphone G.726 ADPCM",
+    0x0141: u"Dictaphone CELP68",
+    0x0142: u"Dictaphone CELP54",
+    0x0150: u"Qualcomm PUREVOICE",
+    0x0151: u"Qualcomm HALFRATE",
+    0x0155: u"Ring Zero Systems TUBGSM",
+    0x0160: u"Windows Media Audio Standard",
+    0x0161: u"Windows Media Audio 9 Standard",
+    0x0162: u"Windows Media Audio 9 Professional",
+    0x0163: u"Windows Media Audio 9 Lossless",
+    0x0164: u"Windows Media Audio Pro over SPDIF",
+    0x0170: u"Unisys NAP ADPCM",
+    0x0171: u"Unisys NAP ULAW",
+    0x0172: u"Unisys NAP ALAW",
+    0x0173: u"Unisys NAP 16K",
+    0x0174: u"Sycom ACM SYC008",
+    0x0175: u"Sycom ACM SYC701 G725",
+    0x0176: u"Sycom ACM SYC701 CELP54",
+    0x0177: u"Sycom ACM SYC701 CELP68",
+    0x0178: u"Knowledge Adventure ADPCM",
+    0x0180: u"Fraunhofer IIS MPEG-2 AAC",
+    0x0190: u"Digital Theater Systems DTS",
+    0x0200: u"Creative Labs ADPCM",
+    0x0202: u"Creative Labs FastSpeech8",
+    0x0203: u"Creative Labs FastSpeech10",
+    0x0210: u"UHER informatic GmbH ADPCM",
+    0x0215: u"Ulead DV Audio",
+    0x0216: u"Ulead DV Audio",
+    0x0220: u"Quarterdeck",
+    0x0230: u"I-link Worldwide ILINK VC",
+    0x0240: u"Aureal Semiconductor RAW SPORT",
+    0x0249: u"Generic Passthru",
+    0x0250: u"Interactive Products HSX",
+    0x0251: u"Interactive Products RPELP",
+    0x0260: u"Consistent Software CS2",
+    0x0270: u"Sony SCX",
+    0x0271: u"Sony SCY",
+    0x0272: u"Sony ATRAC3",
+    0x0273: u"Sony SPC",
+    0x0280: u"Telum Audio",
+    0x0281: u"Telum IA Audio",
+    0x0285: u"Norcom Voice Systems ADPCM",
+    0x0300: u"Fujitsu TOWNS SND",
+    0x0350: u"Micronas SC4 Speech",
+    0x0351: u"Micronas CELP833",
+    0x0400: u"Brooktree BTV Digital",
+    0x0401: u"Intel Music Coder",
+    0x0402: u"Intel Audio",
+    0x0450: u"QDesign Music",
+    0x0500: u"On2 AVC0 Audio",
+    0x0501: u"On2 AVC1 Audio",
+    0x0680: u"AT&T Labs VME VMPCM",
+    0x0681: u"AT&T Labs TPC",
+    0x08AE: u"ClearJump Lightwave Lossless",
+    0x1000: u"Olivetti GSM",
+    0x1001: u"Olivetti ADPCM",
+    0x1002: u"Olivetti CELP",
+    0x1003: u"Olivetti SBC",
+    0x1004: u"Olivetti OPR",
+    0x1100: u"Lernout & Hauspie",
+    0x1101: u"Lernout & Hauspie CELP",
+    0x1102: u"Lernout & Hauspie SBC8",
+    0x1103: u"Lernout & Hauspie SBC12",
+    0x1104: u"Lernout & Hauspie SBC16",
+    0x1400: u"Norris Communication",
+    0x1401: u"ISIAudio",
+    0x1500: u"AT&T Labs Soundspace Music Compression",
+    0x1600: u"Microsoft MPEG ADTS AAC",
+    0x1601: u"Microsoft MPEG RAW AAC",
+    0x1608: u"Nokia MPEG ADTS AAC",
+    0x1609: u"Nokia MPEG RAW AAC",
+    0x181C: u"VoxWare MetaVoice RT24",
+    0x1971: u"Sonic Foundry Lossless",
+    0x1979: u"Innings Telecom ADPCM",
+    0x1FC4: u"NTCSoft ALF2CD ACM",
+    0x2000: u"Dolby AC3",
+    0x2001: u"DTS",
+    0x4143: u"Divio AAC",
+    0x4201: u"Nokia Adaptive Multi-Rate",
+    0x4243: u"Divio G.726",
+    0x4261: u"ITU-T H.261",
+    0x4263: u"ITU-T H.263",
+    0x4264: u"ITU-T H.264",
+    0x674F: u"Ogg Vorbis Mode 1",
+    0x6750: u"Ogg Vorbis Mode 2",
+    0x6751: u"Ogg Vorbis Mode 3",
+    0x676F: u"Ogg Vorbis Mode 1+",
+    0x6770: u"Ogg Vorbis Mode 2+",
+    0x6771: u"Ogg Vorbis Mode 3+",
+    0x7000: u"3COM NBX Audio",
+    0x706D: u"FAAD AAC Audio",
+    0x77A1: u"True Audio Lossless Audio",
+    0x7A21: u"GSM-AMR CBR 3GPP Audio",
+    0x7A22: u"GSM-AMR VBR 3GPP Audio",
+    0xA100: u"Comverse Infosys G723.1",
+    0xA101: u"Comverse Infosys AVQSBC",
+    0xA102: u"Comverse Infosys SBC",
+    0xA103: u"Symbol Technologies G729a",
+    0xA104: u"VoiceAge AMR WB",
+    0xA105: u"Ingenient Technologies G.726",
+    0xA106: u"ISO/MPEG-4 Advanced Audio Coding (AAC)",
+    0xA107: u"Encore Software Ltd's G.726",
+    0xA108: u"ZOLL Medical Corporation ASAO",
+    0xA109: u"Speex Voice",
+    0xA10A: u"Vianix MASC Speech Compression",
+    0xA10B: u"Windows Media 9 Spectrum Analyzer Output",
+    0xA10C: u"Media Foundation Spectrum Analyzer Output",
+    0xA10D: u"GSM 6.10 (Full-Rate) Speech",
+    0xA10E: u"GSM 6.20 (Half-Rate) Speech",
+    0xA10F: u"GSM 6.60 (Enchanced Full-Rate) Speech",
+    0xA110: u"GSM 6.90 (Adaptive Multi-Rate) Speech",
+    0xA111: u"GSM Adaptive Multi-Rate WideBand Speech",
+    0xA112: u"Polycom G.722",
+    0xA113: u"Polycom G.728",
+    0xA114: u"Polycom G.729a",
+    0xA115: u"Polycom Siren",
+    0xA116: u"Global IP Sound ILBC",
+    0xA117: u"Radio Time Time Shifted Radio",
+    0xA118: u"Nice Systems ACA",
+    0xA119: u"Nice Systems ADPCM",
+    0xA11A: u"Vocord Group ITU-T G.721",
+    0xA11B: u"Vocord Group ITU-T G.726",
+    0xA11C: u"Vocord Group ITU-T G.722.1",
+    0xA11D: u"Vocord Group ITU-T G.728",
+    0xA11E: u"Vocord Group ITU-T G.729",
+    0xA11F: u"Vocord Group ITU-T G.729a",
+    0xA120: u"Vocord Group ITU-T G.723.1",
+    0xA121: u"Vocord Group LBC",
+    0xA122: u"Nice G.728",
+    0xA123: u"France Telecom G.729 ACM Audio",
+    0xA124: u"CODIAN Audio",
+    0xCC12: u"Intel YUV12 Codec",
+    0xCFCC: u"Digital Processing Systems Perception Motion JPEG",
+    0xD261: u"DEC H.261",
+    0xD263: u"DEC H.263",
+    0xFFFE: u"Extensible Wave Format",
+    0xFFFF: u"Unregistered",
+}
@@ -0,0 +1,358 @@
+# -*- coding: utf-8 -*-
+# Copyright (C) 2017  Boris Pruessmann
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+
+"""Read and write DSF audio stream information and tags."""
+
+
+import sys
+import struct
+
+from ._compat import cBytesIO, reraise, endswith
+
+from mutagen import FileType, StreamInfo
+from mutagen._util import cdata, MutagenError, loadfile, convert_error
+from mutagen.id3 import ID3
+from mutagen.id3._util import ID3NoHeaderError, error as ID3Error
+
+
+__all__ = ["DSF", "Open", "delete"]
+
+
+class error(MutagenError):
+    pass
+
+
+class DSFChunk(object):
+    """A generic chunk of a DSFFile."""
+
+    chunk_offset = 0
+    chunk_header = "    "
+    chunk_size = -1
+
+    def __init__(self, fileobj, create=False):
+        self.fileobj = fileobj
+
+        if not create:
+            self.chunk_offset = fileobj.tell()
+            self.load()
+
+    def load(self):
+        raise NotImplementedError
+
+    def write(self):
+        raise NotImplementedError
+
+
+class DSDChunk(DSFChunk):
+    """Represents the first chunk of a DSF file"""
+
+    CHUNK_SIZE = 28
+
+    total_size = 0
+    offset_metdata_chunk = 0
+
+    def __init__(self, fileobj, create=False):
+        super(DSDChunk, self).__init__(fileobj, create)
+
+        if create:
+            self.chunk_header = b"DSD "
+            self.chunk_size = DSDChunk.CHUNK_SIZE
+
+    def load(self):
+        data = self.fileobj.read(DSDChunk.CHUNK_SIZE)
+        if len(data) != DSDChunk.CHUNK_SIZE:
+            raise error("DSF chunk truncated")
+
+        self.chunk_header = data[0:4]
+        if self.chunk_header != b"DSD ":
+            raise error("DSF dsd header not found")
+
+        self.chunk_size = cdata.ulonglong_le(data[4:12])
+        if self.chunk_size != DSDChunk.CHUNK_SIZE:
+            raise error("DSF dsd header size mismatch")
+
+        self.total_size = cdata.ulonglong_le(data[12:20])
+        self.offset_metdata_chunk = cdata.ulonglong_le(data[20:28])
+
+    def write(self):
+        f = cBytesIO()
+        f.write(self.chunk_header)
+        f.write(struct.pack("<Q", DSDChunk.CHUNK_SIZE))
+        f.write(struct.pack("<Q", self.total_size))
+        f.write(struct.pack("<Q", self.offset_metdata_chunk))
+
+        self.fileobj.seek(self.chunk_offset)
+        self.fileobj.write(f.getvalue())
+
+    def pprint(self):
+        return (u"DSD Chunk (Total file size = %d, "
+                u"Pointer to Metadata chunk = %d)" % (
+                    self.total_size, self.offset_metdata_chunk))
+
+
+class FormatChunk(DSFChunk):
+
+    CHUNK_SIZE = 52
+
+    VERSION = 1
+
+    FORMAT_DSD_RAW = 0
+    """Format ID: DSD Raw"""
+
+    format_version = VERSION
+    format_id = FORMAT_DSD_RAW
+    channel_type = 1
+    channel_num = 1
+    sampling_frequency = 2822400
+    bits_per_sample = 1
+    sample_count = 0
+    block_size_per_channel = 4096
+
+    def __init__(self, fileobj, create=False):
+        super(FormatChunk, self).__init__(fileobj, create)
+
+        if create:
+            self.chunk_header = b"fmt "
+            self.chunk_size = FormatChunk.CHUNK_SIZE
+
+    def load(self):
+        data = self.fileobj.read(FormatChunk.CHUNK_SIZE)
+        if len(data) != FormatChunk.CHUNK_SIZE:
+            raise error("DSF chunk truncated")
+
+        self.chunk_header = data[0:4]
+        if self.chunk_header != b"fmt ":
+            raise error("DSF fmt header not found")
+
+        self.chunk_size = cdata.ulonglong_le(data[4:12])
+        if self.chunk_size != FormatChunk.CHUNK_SIZE:
+            raise error("DSF dsd header size mismatch")
+
+        self.format_version = cdata.uint_le(data[12:16])
+        if self.format_version != FormatChunk.VERSION:
+            raise error("Unsupported format version")
+
+        self.format_id = cdata.uint_le(data[16:20])
+        if self.format_id != FormatChunk.FORMAT_DSD_RAW:
+            raise error("Unsupported format ID")
+
+        self.channel_type = cdata.uint_le(data[20:24])
+        self.channel_num = cdata.uint_le(data[24:28])
+        self.sampling_frequency = cdata.uint_le(data[28:32])
+        self.bits_per_sample = cdata.uint_le(data[32:36])
+        self.sample_count = cdata.ulonglong_le(data[36:44])
+
+    def pprint(self):
+        return u"fmt Chunk (Channel Type = %d, Channel Num = %d, " \
+               u"Sampling Frequency = %d, %.2f seconds)" % \
+               (self.channel_type, self.channel_num, self.sampling_frequency,
+                self.length)
+
+
+class DataChunk(DSFChunk):
+
+    CHUNK_SIZE = 12
+
+    data = ""
+
+    def __init__(self, fileobj, create=False):
+        super(DataChunk, self).__init__(fileobj, create)
+
+        if create:
+            self.chunk_header = b"data"
+            self.chunk_size = DataChunk.CHUNK_SIZE
+
+    def load(self):
+        data = self.fileobj.read(DataChunk.CHUNK_SIZE)
+        if len(data) != DataChunk.CHUNK_SIZE:
+            raise error("DSF chunk truncated")
+
+        self.chunk_header = data[0:4]
+        if self.chunk_header != b"data":
+            raise error("DSF data header not found")
+
+        self.chunk_size = cdata.ulonglong_le(data[4:12])
+        if self.chunk_size < DataChunk.CHUNK_SIZE:
+            raise error("DSF data header size mismatch")
+
+    def pprint(self):
+        return u"data Chunk (Chunk Offset = %d, Chunk Size = %d)" % (
+            self.chunk_offset, self.chunk_size)
+
+
+class _DSFID3(ID3):
+    """A DSF file with ID3v2 tags"""
+
+    @convert_error(IOError, error)
+    def _pre_load_header(self, fileobj):
+        fileobj.seek(0)
+        id3_location = DSDChunk(fileobj).offset_metdata_chunk
+        if id3_location == 0:
+            raise ID3NoHeaderError("File has no existing ID3 tag")
+
+        fileobj.seek(id3_location)
+
+    @convert_error(IOError, error)
+    @loadfile(writable=True)
+    def save(self, filething, v2_version=4, v23_sep='/', padding=None):
+        """Save ID3v2 data to the DSF file"""
+
+        fileobj = filething.fileobj
+        fileobj.seek(0)
+
+        dsd_header = DSDChunk(fileobj)
+        if dsd_header.offset_metdata_chunk == 0:
+            # create a new ID3 chunk at the end of the file
+            fileobj.seek(0, 2)
+
+            # store reference to ID3 location
+            dsd_header.offset_metdata_chunk = fileobj.tell()
+            dsd_header.write()
+
+        try:
+            data = self._prepare_data(
+                fileobj, dsd_header.offset_metdata_chunk, self.size,
+                v2_version, v23_sep, padding)
+        except ID3Error as e:
+            reraise(error, e, sys.exc_info()[2])
+
+        fileobj.seek(dsd_header.offset_metdata_chunk)
+        fileobj.write(data)
+        fileobj.truncate()
+
+        # Update total file size
+        dsd_header.total_size = fileobj.tell()
+        dsd_header.write()
+
+
+class DSFInfo(StreamInfo):
+    """DSF audio stream information.
+
+    Information is parsed from the fmt chunk of the DSF file.
+
+    Attributes:
+        length (`float`): audio length, in seconds.
+        channels (`int`): The number of audio channels.
+        sample_rate (`int`):
+            Sampling frequency, in Hz.
+            (2822400, 5644800, 11289600, or 22579200)
+        bits_per_sample (`int`): The audio sample size.
+        bitrate (`int`): The audio bitrate.
+    """
+
+    def __init__(self, fmt_chunk):
+        self.fmt_chunk = fmt_chunk
+
+    @property
+    def length(self):
+        return float(self.fmt_chunk.sample_count) / self.sample_rate
+
+    @property
+    def channels(self):
+        return self.fmt_chunk.channel_num
+
+    @property
+    def sample_rate(self):
+        return self.fmt_chunk.sampling_frequency
+
+    @property
+    def bits_per_sample(self):
+        return self.fmt_chunk.bits_per_sample
+
+    @property
+    def bitrate(self):
+        return self.sample_rate * self.bits_per_sample * self.channels
+
+    def pprint(self):
+        return u"%d channel DSF @ %d bits, %s Hz, %.2f seconds" % (
+            self.channels, self.bits_per_sample, self.sample_rate, self.length)
+
+
+class DSFFile(object):
+
+    dsd_chunk = None
+    fmt_chunk = None
+    data_chunk = None
+
+    def __init__(self, fileobj):
+        self.dsd_chunk = DSDChunk(fileobj)
+        self.fmt_chunk = FormatChunk(fileobj)
+        self.data_chunk = DataChunk(fileobj)
+
+
+class DSF(FileType):
+    """An DSF audio file.
+
+    Arguments:
+        filething (filething)
+
+    Attributes:
+        info (`DSFInfo`)
+        tags (`mutagen.id3.ID3Tags` or `None`)
+    """
+
+    _mimes = ["audio/dsf"]
+
+    @staticmethod
+    def score(filename, fileobj, header):
+        return header.startswith(b"DSD ") * 2 + \
+            endswith(filename.lower(), ".dsf")
+
+    def add_tags(self):
+        """Add a DSF tag block to the file."""
+
+        if self.tags is None:
+            self.tags = _DSFID3()
+        else:
+            raise error("an ID3 tag already exists")
+
+    @convert_error(IOError, error)
+    @loadfile()
+    def load(self, filething, **kwargs):
+        dsf_file = DSFFile(filething.fileobj)
+
+        try:
+            self.tags = _DSFID3(filething.fileobj, **kwargs)
+        except ID3NoHeaderError:
+            self.tags = None
+        except ID3Error as e:
+            raise error(e)
+        else:
+            self.tags.filename = self.filename
+
+        self.info = DSFInfo(dsf_file.fmt_chunk)
+
+    @loadfile(writable=True)
+    def delete(self, filething):
+        self.tags = None
+        delete(filething)
+
+
+@convert_error(IOError, error)
+@loadfile(method=False, writable=True)
+def delete(filething):
+    """Remove tags from a file.
+
+    Args:
+        filething (filething)
+    Raises:
+        mutagen.MutagenError
+    """
+
+    dsf_file = DSFFile(filething.fileobj)
+
+    if dsf_file.dsd_chunk.offset_metdata_chunk != 0:
+        id3_location = dsf_file.dsd_chunk.offset_metdata_chunk
+        dsf_file.dsd_chunk.offset_metdata_chunk = 0
+        dsf_file.dsd_chunk.write()
+
+        filething.fileobj.seek(id3_location)
+        filething.fileobj.truncate()
+
+
+Open = DSF
@@ -1,10 +1,10 @@
 # -*- coding: utf-8 -*-
-
 # Copyright (C) 2006  Joe Wreschnig
 #
 # This program is free software; you can redistribute it and/or modify
-# it under the terms of version 2 of the GNU General Public License as
-# published by the Free Software Foundation.
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.

 """Easier access to ID3 tags.

@@ -16,7 +16,7 @@ import mutagen.id3

 from ._compat import iteritems, text_type, PY2
 from mutagen import Metadata
-from mutagen._util import DictMixin, dict_match
+from mutagen._util import DictMixin, dict_match, loadfile
 from mutagen.id3 import ID3, error, delete, ID3FileType


@@ -32,7 +32,9 @@ class EasyID3KeyError(KeyError, ValueError, error):


 class EasyID3(DictMixin, Metadata):
-    """A file with an ID3 tag.
+    """EasyID3(filething=None)
+
+    A file with an ID3 tag.

    Like Vorbis comments, EasyID3 keys are case-insensitive ASCII
    strings. Only a subset of ID3 frames are supported by default. Use
@@ -148,19 +150,14 @@ class EasyID3(DictMixin, Metadata):
            return list(id3[frameid])

        def setter(id3, key, value):
-            try:
-                frame = id3[frameid]
-            except KeyError:
-                enc = 0
-                # Store 8859-1 if we can, per MusicBrainz spec.
-                for v in value:
-                    if v and max(v) > u'\x7f':
-                        enc = 3
-                        break
+            enc = 0
+            # Store 8859-1 if we can, per MusicBrainz spec.
+            for v in value:
+                if v and max(v) > u'\x7f':
+                    enc = 3
+                    break

-                id3.add(mutagen.id3.TXXX(encoding=enc, text=value, desc=desc))
-            else:
-                frame.text = value
+            id3.add(mutagen.id3.TXXX(encoding=enc, text=value, desc=desc))

        def deleter(id3, key):
            del(id3[frameid])
@@ -175,10 +172,30 @@ class EasyID3(DictMixin, Metadata):
    load = property(lambda s: s.__id3.load,
                    lambda s, v: setattr(s.__id3, 'load', v))

-    def save(self, *args, **kwargs):
-        # ignore v2_version until we support 2.3 here
-        kwargs.pop("v2_version", None)
-        self.__id3.save(*args, **kwargs)
+    @loadfile(writable=True, create=True)
+    def save(self, filething, v1=1, v2_version=4, v23_sep='/', padding=None):
+        """save(filething=None, v1=1, v2_version=4, v23_sep='/', padding=None)
+
+        Save changes to a file.
+        See :meth:`mutagen.id3.ID3.save` for more info.
+        """
+
+        if v2_version == 3:
+            # EasyID3 only works with v2.4 frames, so update_to_v23() would
+            # break things. We have to save a shallow copy of all tags
+            # and restore it after saving. Due to CHAP/CTOC copying has
+            # to be done recursively implemented in ID3Tags.
+            backup = self.__id3._copy()
+            try:
+                self.__id3.update_to_v23()
+                self.__id3.save(
+                    filething, v1=v1, v2_version=v2_version, v23_sep=v23_sep,
+                    padding=padding)
+            finally:
+                self.__id3._restore(backup)
+        else:
+            self.__id3.save(filething, v1=v1, v2_version=v2_version,
+                            v23_sep=v23_sep, padding=padding)

    delete = property(lambda s: s.__id3.delete,
                      lambda s, v: setattr(s.__id3, 'delete', v))
@@ -190,30 +207,27 @@ class EasyID3(DictMixin, Metadata):
                    lambda s, fn: setattr(s.__id3, 'size', s))

    def __getitem__(self, key):
-        key = key.lower()
-        func = dict_match(self.Get, key, self.GetFallback)
+        func = dict_match(self.Get, key.lower(), self.GetFallback)
        if func is not None:
            return func(self.__id3, key)
        else:
            raise EasyID3KeyError("%r is not a valid key" % key)

    def __setitem__(self, key, value):
-        key = key.lower()
        if PY2:
            if isinstance(value, basestring):
                value = [value]
        else:
            if isinstance(value, text_type):
                value = [value]
-        func = dict_match(self.Set, key, self.SetFallback)
+        func = dict_match(self.Set, key.lower(), self.SetFallback)
        if func is not None:
            return func(self.__id3, key, value)
        else:
            raise EasyID3KeyError("%r is not a valid key" % key)

    def __delitem__(self, key):
-        key = key.lower()
-        func = dict_match(self.Delete, key, self.DeleteFallback)
+        func = dict_match(self.Delete, key.lower(), self.DeleteFallback)
        if func is not None:
            return func(self.__id3, key)
        else:
@@ -469,7 +483,7 @@ for frameid, key in iteritems({
    "TIT2": "title",
    "TIT3": "version",
    "TPE1": "artist",
-    "TPE2": "performer",
+    "TPE2": "albumartist",
    "TPE3": "conductor",
    "TPE4": "arranger",
    "TPOS": "discnumber",
@@ -518,6 +532,7 @@ for desc, key in iteritems({
    u"MusicBrainz Disc Id": "musicbrainz_discid",
    u"ASIN": "asin",
    u"ALBUMARTISTSORT": "albumartistsort",
+    u"PERFORMER": "performer",
    u"BARCODE": "barcode",
    u"CATALOGNUMBER": "catalognumber",
    u"MusicBrainz Release Track Id": "musicbrainz_releasetrackid",
@@ -530,5 +545,15 @@ for desc, key in iteritems({


 class EasyID3FileType(ID3FileType):
-    """Like ID3FileType, but uses EasyID3 for tags."""
+    """EasyID3FileType(filething=None)
+
+    Like ID3FileType, but uses EasyID3 for tags.
+
+    Arguments:
+        filething (filething)
+
+    Attributes:
+        tags (`EasyID3`)
+    """
+
    ID3 = EasyID3
@@ -1,12 +1,12 @@
 # -*- coding: utf-8 -*-
-
 # Copyright (C) 2009  Joe Wreschnig
 #
 # This program is free software; you can redistribute it and/or modify
-# it under the terms of version 2 of the GNU General Public License as
-# published by the Free Software Foundation.
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.

-from mutagen import Metadata
+from mutagen import Tags
 from mutagen._util import DictMixin, dict_match
 from mutagen.mp4 import MP4, MP4Tags, error, delete
 from ._compat import PY2, text_type, PY3
@@ -19,8 +19,10 @@ class EasyMP4KeyError(error, KeyError, ValueError):
    pass


-class EasyMP4Tags(DictMixin, Metadata):
-    """A file with MPEG-4 iTunes metadata.
+class EasyMP4Tags(DictMixin, Tags):
+    """EasyMP4Tags()
+
+    A file with MPEG-4 iTunes metadata.

    Like Vorbis comments, EasyMP4Tags keys are case-insensitive ASCII
    strings, and values are a list of Unicode strings (and these lists
@@ -40,6 +42,7 @@ class EasyMP4Tags(DictMixin, Metadata):
        self.load = self.__mp4.load
        self.save = self.__mp4.save
        self.delete = self.__mp4.delete
+        self._padding = self.__mp4._padding

    filename = property(lambda s: s.__mp4.filename,
                        lambda s, fn: setattr(s.__mp4, 'filename', fn))
@@ -267,11 +270,14 @@ for name, key in {


 class EasyMP4(MP4):
-    """Like :class:`MP4 <mutagen.mp4.MP4>`,
-    but uses :class:`EasyMP4Tags` for tags.
+    """EasyMP4(filelike)

-    :ivar info: :class:`MP4Info <mutagen.mp4.MP4Info>`
-    :ivar tags: :class:`EasyMP4Tags`
+    Like :class:`MP4 <mutagen.mp4.MP4>`, but uses :class:`EasyMP4Tags` for
+    tags.
+
+    Attributes:
+        info (`mutagen.mp4.MP4Info`)
+        tags (`EasyMP4Tags`)
    """

    MP4Tags = EasyMP4Tags
@@ -1,10 +1,10 @@
 # -*- coding: utf-8 -*-
-
 # Copyright (C) 2005  Joe Wreschnig
 #
 # This program is free software; you can redistribute it and/or modify
-# it under the terms of version 2 of the GNU General Public License as
-# published by the Free Software Foundation.
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.

 """Read and write FLAC Vorbis comments and stream information.

@@ -26,13 +26,15 @@ import struct
 from ._vorbis import VCommentDict
 import mutagen

-from ._compat import cBytesIO, endswith, chr_
-from mutagen._util import insert_bytes, MutagenError
-from mutagen.id3 import BitPaddedInt
+from ._compat import cBytesIO, endswith, chr_, xrange
+from mutagen._util import resize_bytes, MutagenError, get_size, loadfile, \
+    convert_error
+from mutagen._tags import PaddingInfo
+from mutagen.id3._util import BitPaddedInt
 from functools import reduce


-class error(IOError, MutagenError):
+class error(MutagenError):
    pass


@@ -56,7 +58,8 @@ class StrictFileObject(object):

    def __init__(self, fileobj):
        self._fileobj = fileobj
-        for m in ["close", "tell", "seek", "write", "name"]:
+        for m in ["close", "tell", "seek", "write", "name", "flush",
+                  "truncate"]:
            if hasattr(fileobj, m):
                setattr(self, m, getattr(fileobj, m))

@@ -78,11 +81,19 @@ class MetadataBlock(object):
    blocks, and also as a container for data blobs of unknown blocks.

    Attributes:
-
-    * data -- raw binary data for this block
+        data (`bytes`): raw binary data for this block
    """

    _distrust_size = False
+    """For block types setting this, we don't trust the size field and
+    use the size of the content instead."""
+
+    _invalid_overflow_size = -1
+    """In case the real size was bigger than what is representable by the
+    24 bit size field, we save the wrong specified size here. This can
+    only be set if _distrust_size is True"""
+
+    _MAX_SIZE = 2 ** 24 - 1

    def __init__(self, data):
        """Parse the given data string or file-like as a metadata block.
@@ -103,41 +114,64 @@ class MetadataBlock(object):
    def write(self):
        return self.data

-    @staticmethod
-    def writeblocks(blocks):
-        """Render metadata block as a byte string."""
-        data = []
-        codes = [[block.code, block.write()] for block in blocks]
-        codes[-1][0] |= 128
-        for code, datum in codes:
-            byte = chr_(code)
-            if len(datum) > 2 ** 24:
-                raise error("block is too long to write")
-            length = struct.pack(">I", len(datum))[-3:]
-            data.append(byte + length + datum)
-        return b"".join(data)
+    @classmethod
+    def _writeblock(cls, block, is_last=False):
+        """Returns the block content + header.

-    @staticmethod
-    def group_padding(blocks):
-        """Consolidate FLAC padding metadata blocks.
-
-        The overall size of the rendered blocks does not change, so
-        this adds several bytes of padding for each merged block.
+        Raises error.
        """

-        paddings = [b for b in blocks if isinstance(b, Padding)]
-        for p in paddings:
-            blocks.remove(p)
-        # total padding size is the sum of padding sizes plus 4 bytes
-        # per removed header.
-        size = sum(padding.length for padding in paddings)
-        padding = Padding()
-        padding.length = size + 4 * (len(paddings) - 1)
-        blocks.append(padding)
+        data = bytearray()
+        code = (block.code | 128) if is_last else block.code
+        datum = block.write()
+        size = len(datum)
+        if size > cls._MAX_SIZE:
+            if block._distrust_size and block._invalid_overflow_size != -1:
+                # The original size of this block was (1) wrong and (2)
+                # the real size doesn't allow us to save the file
+                # according to the spec (too big for 24 bit uint). Instead
+                # simply write back the original wrong size.. at least
+                # we don't make the file more "broken" as it is.
+                size = block._invalid_overflow_size
+            else:
+                raise error("block is too long to write")
+        assert not size > cls._MAX_SIZE
+        length = struct.pack(">I", size)[-3:]
+        data.append(code)
+        data += length
+        data += datum
+        return data
+
+    @classmethod
+    def _writeblocks(cls, blocks, available, cont_size, padding_func):
+        """Render metadata block as a byte string."""
+
+        # write everything except padding
+        data = bytearray()
+        for block in blocks:
+            if isinstance(block, Padding):
+                continue
+            data += cls._writeblock(block)
+        blockssize = len(data)
+
+        # take the padding overhead into account. we always add one
+        # to make things simple.
+        padding_block = Padding()
+        blockssize += len(cls._writeblock(padding_block))
+
+        # finally add a padding block
+        info = PaddingInfo(available - blockssize, cont_size)
+        padding_block.length = min(info._get_padding(padding_func),
+                                   cls._MAX_SIZE)
+        data += cls._writeblock(padding_block, is_last=True)
+
+        return data


 class StreamInfo(MetadataBlock, mutagen.StreamInfo):
-    """FLAC stream information.
+    """StreamInfo()
+
+    FLAC stream information.

    This contains information about the audio data in the FLAC file.
    Unlike most stream information objects in Mutagen, changes to this
@@ -146,17 +180,18 @@ class StreamInfo(MetadataBlock, mutagen.StreamInfo):
    attributes of this block.

    Attributes:
-
-    * min_blocksize -- minimum audio block size
-    * max_blocksize -- maximum audio block size
-    * sample_rate -- audio sample rate in Hz
-    * channels -- audio channels (1 for mono, 2 for stereo)
-    * bits_per_sample -- bits per sample
-    * total_samples -- total samples in file
-    * length -- audio length in seconds
+        min_blocksize (`int`): minimum audio block size
+        max_blocksize (`int`): maximum audio block size
+        sample_rate (`int`): audio sample rate in Hz
+        channels (`int`): audio channels (1 for mono, 2 for stereo)
+        bits_per_sample (`int`): bits per sample
+        total_samples (`int`): total samples in file
+        length (`float`): audio length in seconds
+        bitrate (`int`): bitrate in bits per second, as an int
    """

    code = 0
+    bitrate = 0

    def __eq__(self, other):
        try:
@@ -224,11 +259,13 @@ class StreamInfo(MetadataBlock, mutagen.StreamInfo):
        return f.getvalue()

    def pprint(self):
-        return "FLAC, %.2f seconds, %d Hz" % (self.length, self.sample_rate)
+        return u"FLAC, %.2f seconds, %d Hz" % (self.length, self.sample_rate)


 class SeekPoint(tuple):
-    """A single seek point in a FLAC file.
+    """SeekPoint()
+
+    A single seek point in a FLAC file.

    Placeholder seek points have first_sample of 0xFFFFFFFFFFFFFFFFL,
    and byte_offset and num_samples undefined. Seek points must be
@@ -238,10 +275,9 @@ class SeekPoint(tuple):
    may be any number of them.

    Attributes:
-
-    * first_sample -- sample number of first sample in the target frame
-    * byte_offset -- offset from first frame to target frame
-    * num_samples -- number of samples in target frame
+        first_sample (`int`): sample number of first sample in the target frame
+        byte_offset (`int`): offset from first frame to target frame
+        num_samples (`int`): number of samples in target frame
    """

    def __new__(cls, first_sample, byte_offset, num_samples):
@@ -257,8 +293,7 @@ class SeekTable(MetadataBlock):
    """Read and write FLAC seek tables.

    Attributes:
-
-    * seekpoints -- list of SeekPoint objects
+        seekpoints: list of SeekPoint objects
    """

    __SEEKPOINT_FORMAT = '>QQH'
@@ -301,7 +336,9 @@ class SeekTable(MetadataBlock):


 class VCFLACDict(VCommentDict):
-    """Read and write FLAC Vorbis comments.
+    """VCFLACDict()
+
+    Read and write FLAC Vorbis comments.

    FLACs don't use the framing bit at the end of the comment block.
    So this extends VCommentDict to not use the framing bit.
@@ -318,7 +355,9 @@ class VCFLACDict(VCommentDict):


 class CueSheetTrackIndex(tuple):
-    """Index for a track in a cuesheet.
+    """CueSheetTrackIndex(index_number, index_offset)
+
+    Index for a track in a cuesheet.

    For CD-DA, an index_number of 0 corresponds to the track
    pre-gap. The first index in a track must have a number of 0 or 1,
@@ -327,9 +366,8 @@ class CueSheetTrackIndex(tuple):
    divisible by 588 samples.

    Attributes:
-
-    * index_number -- index point number
-    * index_offset -- offset in samples from track start
+        index_number (`int`): index point number
+        index_offset (`int`): offset in samples from track start
    """

    def __new__(cls, index_number, index_offset):
@@ -341,7 +379,9 @@ class CueSheetTrackIndex(tuple):


 class CueSheetTrack(object):
-    """A track in a cuesheet.
+    """CueSheetTrack()
+
+    A track in a cuesheet.

    For CD-DA, track_numbers must be 1-99, or 170 for the
    lead-out. Track_numbers must be unique within a cue sheet. There
@@ -349,13 +389,13 @@ class CueSheetTrack(object):
    which must have none.

    Attributes:
-
-    * track_number -- track number
-    * start_offset -- track offset in samples from start of FLAC stream
-    * isrc -- ISRC code
-    * type -- 0 for audio, 1 for digital data
-    * pre_emphasis -- true if the track is recorded with pre-emphasis
-    * indexes -- list of CueSheetTrackIndex objects
+        track_number (`int`): track number
+        start_offset (`int`): track offset in samples from start of FLAC stream
+        isrc (`text`): ISRC code, exactly 12 characters
+        type (`int`): 0 for audio, 1 for digital data
+        pre_emphasis (`bool`): true if the track is recorded with pre-emphasis
+        indexes (List[`mutagen.flac.CueSheetTrackIndex`]):
+            list of CueSheetTrackIndex objects
    """

    def __init__(self, track_number, start_offset, isrc='', type_=0,
@@ -388,19 +428,24 @@ class CueSheetTrack(object):


 class CueSheet(MetadataBlock):
-    """Read and write FLAC embedded cue sheets.
+    """CueSheet()
+
+    Read and write FLAC embedded cue sheets.

    Number of tracks should be from 1 to 100. There should always be
    exactly one lead-out track and that track must be the last track
    in the cue sheet.

    Attributes:
-
-    * media_catalog_number -- media catalog number in ASCII
-    * lead_in_samples -- number of lead-in samples
-    * compact_disc -- true if the cuesheet corresponds to a compact disc
-    * tracks -- list of CueSheetTrack objects
-    * lead_out -- lead-out as CueSheetTrack or None if lead-out was not found
+        media_catalog_number (`text`): media catalog number in ASCII,
+            up to 128 characters
+        lead_in_samples (`int`): number of lead-in samples
+        compact_disc (`bool`): true if the cuesheet corresponds to a
+            compact disc
+        tracks (List[`mutagen.flac.CueSheetTrack`]):
+            list of CueSheetTrack objects
+        lead_out (`mutagen.flac.CueSheetTrack` or `None`):
+            lead-out as CueSheetTrack or None if lead-out was not found
    """

    __CUESHEET_FORMAT = '>128sQB258xB'
@@ -439,7 +484,7 @@ class CueSheet(MetadataBlock):
        self.lead_in_samples = lead_in_samples
        self.compact_disc = bool(flags & 0x80)
        self.tracks = []
-        for i in range(num_tracks):
+        for i in xrange(num_tracks):
            track = data.read(self.__CUESHEET_TRACK_SIZE)
            start_offset, track_number, isrc_padded, flags, num_indexes = \
                struct.unpack(self.__CUESHEET_TRACK_FORMAT, track)
@@ -448,7 +493,7 @@ class CueSheet(MetadataBlock):
            pre_emphasis = bool(flags & 0x40)
            val = CueSheetTrack(
                track_number, start_offset, isrc, type_, pre_emphasis)
-            for j in range(num_indexes):
+            for j in xrange(num_indexes):
                index = data.read(self.__CUESHEET_TRACKINDEX_SIZE)
                index_offset, index_number = struct.unpack(
                    self.__CUESHEET_TRACKINDEX_FORMAT, index)
@@ -490,19 +535,38 @@ class CueSheet(MetadataBlock):


 class Picture(MetadataBlock):
-    """Read and write FLAC embed pictures.
+    """Picture()
+
+    Read and write FLAC embed pictures.
+
+    .. currentmodule:: mutagen

    Attributes:
+        type (`id3.PictureType`): picture type
+            (same as types for ID3 APIC frames)
+        mime (`text`): MIME type of the picture
+        desc (`text`): picture's description
+        width (`int`): width in pixels
+        height (`int`): height in pixels
+        depth (`int`): color depth in bits-per-pixel
+        colors (`int`): number of colors for indexed palettes (like GIF),
+            0 for non-indexed
+        data (`bytes`): picture data

-    * type -- picture type (same as types for ID3 APIC frames)
-    * mime -- MIME type of the picture
-    * desc -- picture's description
-    * width -- width in pixels
-    * height -- height in pixels
-    * depth -- color depth in bits-per-pixel
-    * colors -- number of colors for indexed palettes (like GIF),
-      0 for non-indexed
-    * data -- picture data
+    To create a picture from file (in order to add to a FLAC file),
+    instantiate this object without passing anything to the constructor and
+    then set the properties manually::
+
+        p = Picture()
+
+        with open("Folder.jpg", "rb") as f:
+            pic.data = f.read()
+
+        pic.type = id3.PictureType.COVER_FRONT
+        pic.mime = u"image/jpeg"
+        pic.width = 500
+        pic.height = 500
+        pic.depth = 16 # color depth
    """

    code = 6
@@ -562,12 +626,16 @@ class Picture(MetadataBlock):


 class Padding(MetadataBlock):
-    """Empty padding space for metadata blocks.
+    """Padding()
+
+    Empty padding space for metadata blocks.

    To avoid rewriting the entire FLAC file when editing comments,
    metadata is often padded. Padding should occur at the end, and no
-    more than one padding block should be in any FLAC file. Mutagen
-    handles this with MetadataBlock.group_padding.
+    more than one padding block should be in any FLAC file.
+
+    Attributes:
+        length (`int`): length
    """

    code = 1
@@ -600,18 +668,25 @@ class Padding(MetadataBlock):


 class FLAC(mutagen.FileType):
-    """A FLAC audio file.
+    """FLAC(filething)
+
+    A FLAC audio file.
+
+    Args:
+        filething (filething)

    Attributes:
-
-    * info -- stream information (length, bitrate, sample rate)
-    * tags -- metadata tags, if any
-    * cuesheet -- CueSheet object, if any
-    * seektable -- SeekTable object, if any
-    * pictures -- list of embedded pictures
+        cuesheet (`CueSheet`): if any or `None`
+        seektable (`SeekTable`): if any or `None`
+        pictures (List[`Picture`]): list of embedded pictures
+        info (`StreamInfo`)
+        tags (`mutagen._vorbis.VCommentDict`)
    """

-    _mimes = ["audio/x-flac", "application/x-flac"]
+    _mimes = ["audio/flac", "audio/x-flac", "application/x-flac"]
+
+    info = None
+    tags = None

    METADATA_BLOCKS = [StreamInfo, Padding, None, SeekTable, VCFLACDict,
                       CueSheet, Picture]
@@ -640,10 +715,14 @@ class FLAC(mutagen.FileType):
            # so we have to too.  Instead of parsing the size
            # given, parse an actual Vorbis comment, leaving
            # fileobj in the right position.
-            # http://code.google.com/p/mutagen/issues/detail?id=52
+            # https://github.com/quodlibet/mutagen/issues/52
            # ..same for the Picture block:
-            # http://code.google.com/p/mutagen/issues/detail?id=106
+            # https://github.com/quodlibet/mutagen/issues/106
+            start = fileobj.tell()
            block = block_type(fileobj)
+            real_size = fileobj.tell() - start
+            if real_size > MetadataBlock._MAX_SIZE:
+                block._invalid_overflow_size = size
        else:
            data = fileobj.read(size)
            block = block_type(data)
@@ -677,49 +756,63 @@ class FLAC(mutagen.FileType):

    add_vorbiscomment = add_tags

-    def delete(self, filename=None):
+    @loadfile(writable=True)
+    def delete(self, filething):
        """Remove Vorbis comments from a file.

        If no filename is given, the one most recently loaded is used.
        """
-        if filename is None:
-            filename = self.filename
-        for s in list(self.metadata_blocks):
-            if isinstance(s, VCFLACDict):
-                self.metadata_blocks.remove(s)
-                self.tags = None
-                self.save()
-                break
+
+        if self.tags is not None:
+            self.metadata_blocks.remove(self.tags)
+            try:
+                self.save(filething, padding=lambda x: 0)
+            finally:
+                self.metadata_blocks.append(self.tags)
+            self.tags.clear()

    vc = property(lambda s: s.tags, doc="Alias for tags; don't use this.")

-    def load(self, filename):
+    @convert_error(IOError, error)
+    @loadfile()
+    def load(self, filething):
        """Load file information from a filename."""

+        fileobj = filething.fileobj
+
        self.metadata_blocks = []
        self.tags = None
        self.cuesheet = None
        self.seektable = None
-        self.filename = filename
-        fileobj = StrictFileObject(open(filename, "rb"))
-        try:
-            self.__check_header(fileobj)
-            while self.__read_metadata_block(fileobj):
-                pass
-        finally:
-            fileobj.close()
+
+        fileobj = StrictFileObject(fileobj)
+        self.__check_header(fileobj, filething.name)
+        while self.__read_metadata_block(fileobj):
+            pass

        try:
            self.metadata_blocks[0].length
        except (AttributeError, IndexError):
            raise FLACNoHeaderError("Stream info block not found")

+        if self.info.length:
+            start = fileobj.tell()
+            fileobj.seek(0, 2)
+            self.info.bitrate = int(
+                float(fileobj.tell() - start) * 8 / self.info.length)
+        else:
+            self.info.bitrate = 0
+
    @property
    def info(self):
        return self.metadata_blocks[0]

    def add_picture(self, picture):
-        """Add a new picture to the file."""
+        """Add a new picture to the file.
+
+        Args:
+            picture (Picture)
+        """
        self.metadata_blocks.append(picture)

    def clear_pictures(self):
@@ -730,71 +823,58 @@ class FLAC(mutagen.FileType):

    @property
    def pictures(self):
-        """List of embedded pictures"""
+        """
+        Returns:
+            List[`Picture`]: List of embedded pictures
+        """

        return [b for b in self.metadata_blocks if b.code == Picture.code]

-    def save(self, filename=None, deleteid3=False):
+    @convert_error(IOError, error)
+    @loadfile(writable=True)
+    def save(self, filething, deleteid3=False, padding=None):
        """Save metadata blocks to a file.

+        Args:
+            filething (filething)
+            deleteid3 (bool): delete id3 tags while at it
+            padding (PaddingFunction)
+
        If no filename is given, the one most recently loaded is used.
        """

-        if filename is None:
-            filename = self.filename
-        f = open(filename, 'rb+')
+        f = StrictFileObject(filething.fileobj)
+        header = self.__check_header(f, filething.name)
+        audio_offset = self.__find_audio_offset(f)
+        # "fLaC" and maybe ID3
+        available = audio_offset - header

-        try:
-            # Ensure we've got padding at the end, and only at the end.
-            # If adding makes it too large, we'll scale it down later.
-            self.metadata_blocks.append(Padding(b'\x00' * 1020))
-            MetadataBlock.group_padding(self.metadata_blocks)
+        # Delete ID3v2
+        if deleteid3 and header > 4:
+            available += header - 4
+            header = 4

-            header = self.__check_header(f)
-            # "fLaC" and maybe ID3
-            available = self.__find_audio_offset(f) - header
-            data = MetadataBlock.writeblocks(self.metadata_blocks)
+        content_size = get_size(f) - audio_offset
+        assert content_size >= 0
+        data = MetadataBlock._writeblocks(
+            self.metadata_blocks, available, content_size, padding)
+        data_size = len(data)

-            # Delete ID3v2
-            if deleteid3 and header > 4:
-                available += header - 4
-                header = 4
+        resize_bytes(filething.fileobj, available, data_size, header)
+        f.seek(header - 4)
+        f.write(b"fLaC")
+        f.write(data)

-            if len(data) > available:
-                # If we have too much data, see if we can reduce padding.
-                padding = self.metadata_blocks[-1]
-                newlength = padding.length - (len(data) - available)
-                if newlength > 0:
-                    padding.length = newlength
-                    data = MetadataBlock.writeblocks(self.metadata_blocks)
-                    assert len(data) == available
-
-            elif len(data) < available:
-                # If we have too little data, increase padding.
-                self.metadata_blocks[-1].length += (available - len(data))
-                data = MetadataBlock.writeblocks(self.metadata_blocks)
-                assert len(data) == available
-
-            if len(data) != available:
-                # We couldn't reduce the padding enough.
-                diff = (len(data) - available)
-                insert_bytes(f, diff, header)
-
-            f.seek(header - 4)
-            f.write(b"fLaC" + data)
-
-            # Delete ID3v1
-            if deleteid3:
-                try:
+        # Delete ID3v1
+        if deleteid3:
+            try:
+                f.seek(-128, 2)
+            except IOError:
+                pass
+            else:
+                if f.read(3) == b"TAG":
                    f.seek(-128, 2)
-                except IOError:
-                    pass
-                else:
-                    if f.read(3) == b"TAG":
-                        f.seek(-128, 2)
-                        f.truncate()
-        finally:
-            f.close()
+                    f.truncate()

    def __find_audio_offset(self, fileobj):
        byte = 0x00
@@ -814,7 +894,12 @@ class FLAC(mutagen.FileType):
                fileobj.read(size)
        return fileobj.tell()

-    def __check_header(self, fileobj):
+    def __check_header(self, fileobj, name):
+        """Returns the offset of the flac block start
+        (skipping id3 tags if found). The passed fileobj will be advanced to
+        that offset as well.
+        """
+
        size = 4
        header = fileobj.read(4)
        if header != b"fLaC":
@@ -826,13 +911,24 @@ class FLAC(mutagen.FileType):
                    size = None
        if size is None:
            raise FLACNoHeaderError(
-                "%r is not a valid FLAC file" % fileobj.name)
+                "%r is not a valid FLAC file" % name)
        return size


 Open = FLAC


-def delete(filename):
-    """Remove tags from a file."""
-    FLAC(filename).delete()
+@convert_error(IOError, error)
+@loadfile(method=False, writable=True)
+def delete(filething):
+    """Remove tags from a file.
+
+    Args:
+        filething (filething)
+    Raises:
+        mutagen.MutagenError
+    """
+
+    f = FLAC(filething)
+    filething.fileobj.seek(0)
+    f.delete(filething)
@@ -0,0 +1,406 @@
+# -*- coding: utf-8 -*-
+# Copyright (C) 2005  Michael Urman
+#               2006  Lukas Lalinsky
+#               2013  Christoph Reiter
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+
+import struct
+
+import mutagen
+from mutagen._util import insert_bytes, delete_bytes, enum, \
+    loadfile, convert_error, read_full
+from mutagen._tags import PaddingInfo
+
+from ._util import error, ID3NoHeaderError, ID3UnsupportedVersionError, \
+    BitPaddedInt
+from ._tags import ID3Tags, ID3Header, ID3SaveConfig
+from ._id3v1 import MakeID3v1, find_id3v1
+
+
+@enum
+class ID3v1SaveOptions(object):
+
+    REMOVE = 0
+    """ID3v1 tags will be removed"""
+
+    UPDATE = 1
+    """ID3v1 tags will be updated but not added"""
+
+    CREATE = 2
+    """ID3v1 tags will be created and/or updated"""
+
+
+class ID3(ID3Tags, mutagen.Metadata):
+    """ID3(filething=None)
+
+    A file with an ID3v2 tag.
+
+    If any arguments are given, the :meth:`load` is called with them. If no
+    arguments are given then an empty `ID3` object is created.
+
+    ::
+
+        ID3("foo.mp3")
+        # same as
+        t = ID3()
+        t.load("foo.mp3")
+
+    Arguments:
+        filething (filething): or `None`
+
+    Attributes:
+        version (Tuple[int]): ID3 tag version as a tuple
+        unknown_frames (List[bytes]): raw frame data of any unknown frames
+            found
+        size (int): the total size of the ID3 tag, including the header
+    """
+
+    __module__ = "mutagen.id3"
+
+    PEDANTIC = True
+    """`bool`:
+
+    .. deprecated:: 1.28
+
+        Doesn't have any effect
+    """
+
+    filename = None
+
+    def __init__(self, *args, **kwargs):
+        self._header = None
+        self._version = (2, 4, 0)
+        super(ID3, self).__init__(*args, **kwargs)
+
+    @property
+    def version(self):
+        """`tuple`: ID3 tag version as a tuple (of the loaded file)"""
+
+        if self._header is not None:
+            return self._header.version
+        return self._version
+
+    @version.setter
+    def version(self, value):
+        self._version = value
+
+    @property
+    def f_unsynch(self):
+        if self._header is not None:
+            return self._header.f_unsynch
+        return False
+
+    @property
+    def f_extended(self):
+        if self._header is not None:
+            return self._header.f_extended
+        return False
+
+    @property
+    def size(self):
+        if self._header is not None:
+            return self._header.size
+        return 0
+
+    def _pre_load_header(self, fileobj):
+        # XXX: for aiff to adjust the offset..
+        pass
+
+    @convert_error(IOError, error)
+    @loadfile()
+    def load(self, filething, known_frames=None, translate=True, v2_version=4):
+        """load(filething, known_frames=None, translate=True, v2_version=4)
+
+        Load tags from a filename.
+
+        Args:
+            filename (filething): filename or file object to load tag data from
+            known_frames (Dict[`mutagen.text`, `Frame`]): dict mapping frame
+                IDs to Frame objects
+            translate (bool): Update all tags to ID3v2.3/4 internally. If you
+                intend to save, this must be true or you have to
+                call update_to_v23() / update_to_v24() manually.
+            v2_version (int): if update_to_v23 or update_to_v24 get called
+                (3 or 4)
+
+        Example of loading a custom frame::
+
+            my_frames = dict(mutagen.id3.Frames)
+            class XMYF(Frame): ...
+            my_frames["XMYF"] = XMYF
+            mutagen.id3.ID3(filename, known_frames=my_frames)
+        """
+
+        fileobj = filething.fileobj
+
+        if v2_version not in (3, 4):
+            raise ValueError("Only 3 and 4 possible for v2_version")
+
+        self.unknown_frames = []
+        self._header = None
+        self._padding = 0
+
+        self._pre_load_header(fileobj)
+
+        try:
+            self._header = ID3Header(fileobj)
+        except (ID3NoHeaderError, ID3UnsupportedVersionError):
+            frames, offset = find_id3v1(fileobj)
+            if frames is None:
+                raise
+
+            self.version = ID3Header._V11
+            for v in frames.values():
+                self.add(v)
+        else:
+            # XXX: attach to the header object so we have it in spec parsing..
+            if known_frames is not None:
+                self._header._known_frames = known_frames
+
+            data = read_full(fileobj, self.size - 10)
+            remaining_data = self._read(self._header, data)
+            self._padding = len(remaining_data)
+
+        if translate:
+            if v2_version == 3:
+                self.update_to_v23()
+            else:
+                self.update_to_v24()
+
+    def _prepare_data(self, fileobj, start, available, v2_version, v23_sep,
+                      pad_func):
+
+        if v2_version not in (3, 4):
+            raise ValueError("Only 3 or 4 allowed for v2_version")
+
+        config = ID3SaveConfig(v2_version, v23_sep)
+        framedata = self._write(config)
+
+        needed = len(framedata) + 10
+
+        fileobj.seek(0, 2)
+        trailing_size = fileobj.tell() - start
+
+        info = PaddingInfo(available - needed, trailing_size)
+        new_padding = info._get_padding(pad_func)
+        if new_padding < 0:
+            raise error("invalid padding")
+        new_size = needed + new_padding
+
+        new_framesize = BitPaddedInt.to_str(new_size - 10, width=4)
+        header = struct.pack(
+            '>3sBBB4s', b'ID3', v2_version, 0, 0, new_framesize)
+
+        data = header + framedata
+        assert new_size >= len(data)
+        data += (new_size - len(data)) * b'\x00'
+        assert new_size == len(data)
+
+        return data
+
+    @convert_error(IOError, error)
+    @loadfile(writable=True, create=True)
+    def save(self, filething, v1=1, v2_version=4, v23_sep='/', padding=None):
+        """save(filething=None, v1=1, v2_version=4, v23_sep='/', padding=None)
+
+        Save changes to a file.
+
+        Args:
+            filename (fspath):
+                Filename to save the tag to. If no filename is given,
+                the one most recently loaded is used.
+            v1 (ID3v1SaveOptions):
+                if 0, ID3v1 tags will be removed.
+                if 1, ID3v1 tags will be updated but not added.
+                if 2, ID3v1 tags will be created and/or updated
+            v2 (int):
+                version of ID3v2 tags (3 or 4).
+            v23_sep (text):
+                the separator used to join multiple text values
+                if v2_version == 3. Defaults to '/' but if it's None
+                will be the ID3v2v2.4 null separator.
+            padding (PaddingFunction)
+
+        Raises:
+            mutagen.MutagenError
+
+        By default Mutagen saves ID3v2.4 tags. If you want to save ID3v2.3
+        tags, you must call method update_to_v23 before saving the file.
+
+        The lack of a way to update only an ID3v1 tag is intentional.
+        """
+
+        f = filething.fileobj
+
+        try:
+            header = ID3Header(filething.fileobj)
+        except ID3NoHeaderError:
+            old_size = 0
+        else:
+            old_size = header.size
+
+        data = self._prepare_data(
+            f, 0, old_size, v2_version, v23_sep, padding)
+        new_size = len(data)
+
+        if (old_size < new_size):
+            insert_bytes(f, new_size - old_size, old_size)
+        elif (old_size > new_size):
+            delete_bytes(f, old_size - new_size, new_size)
+        f.seek(0)
+        f.write(data)
+
+        self.__save_v1(f, v1)
+
+    def __save_v1(self, f, v1):
+        tag, offset = find_id3v1(f)
+        has_v1 = tag is not None
+
+        f.seek(offset, 2)
+        if v1 == ID3v1SaveOptions.UPDATE and has_v1 or \
+                v1 == ID3v1SaveOptions.CREATE:
+            f.write(MakeID3v1(self))
+        else:
+            f.truncate()
+
+    @loadfile(writable=True)
+    def delete(self, filething, delete_v1=True, delete_v2=True):
+        """delete(filething=None, delete_v1=True, delete_v2=True)
+
+        Remove tags from a file.
+
+        Args:
+            filething (filething): A filename or `None` to use the one used
+                when loading.
+            delete_v1 (bool): delete any ID3v1 tag
+            delete_v2 (bool): delete any ID3v2 tag
+
+        If no filename is given, the one most recently loaded is used.
+        """
+
+        delete(filething, delete_v1, delete_v2)
+        self.clear()
+
+
+@convert_error(IOError, error)
+@loadfile(method=False, writable=True)
+def delete(filething, delete_v1=True, delete_v2=True):
+    """Remove tags from a file.
+
+    Args:
+        delete_v1 (bool): delete any ID3v1 tag
+        delete_v2 (bool): delete any ID3v2 tag
+
+    Raises:
+        mutagen.MutagenError: In case deleting failed
+    """
+
+    f = filething.fileobj
+
+    if delete_v1:
+        tag, offset = find_id3v1(f)
+        if tag is not None:
+            f.seek(offset, 2)
+            f.truncate()
+
+    # technically an insize=0 tag is invalid, but we delete it anyway
+    # (primarily because we used to write it)
+    if delete_v2:
+        f.seek(0, 0)
+        idata = f.read(10)
+        try:
+            id3, vmaj, vrev, flags, insize = struct.unpack('>3sBBB4s', idata)
+        except struct.error:
+            pass
+        else:
+            insize = BitPaddedInt(insize)
+            if id3 == b'ID3' and insize >= 0:
+                delete_bytes(f, insize + 10, 0)
+
+
+class ID3FileType(mutagen.FileType):
+    """ID3FileType(filething, ID3=None, **kwargs)
+
+    An unknown type of file with ID3 tags.
+
+    Args:
+        filething (filething): A filename or file-like object
+        ID3 (ID3): An ID3 subclass to use for tags.
+
+    Raises:
+        mutagen.MutagenError: In case loading the file failed
+
+    Load stream and tag information from a file.
+
+    A custom tag reader may be used in instead of the default
+    mutagen.id3.ID3 object, e.g. an EasyID3 reader.
+    """
+
+    __module__ = "mutagen.id3"
+
+    ID3 = ID3
+
+    class _Info(mutagen.StreamInfo):
+        length = 0
+
+        def __init__(self, fileobj, offset):
+            pass
+
+        @staticmethod
+        def pprint():
+            return u"Unknown format with ID3 tag"
+
+    @staticmethod
+    def score(filename, fileobj, header_data):
+        return header_data.startswith(b"ID3")
+
+    def add_tags(self, ID3=None):
+        """Add an empty ID3 tag to the file.
+
+        Args:
+            ID3 (ID3): An ID3 subclass to use or `None` to use the one
+                that used when loading.
+
+        A custom tag reader may be used in instead of the default
+        `ID3` object, e.g. an `mutagen.easyid3.EasyID3` reader.
+        """
+
+        if ID3 is None:
+            ID3 = self.ID3
+        if self.tags is None:
+            self.ID3 = ID3
+            self.tags = ID3()
+        else:
+            raise error("an ID3 tag already exists")
+
+    @loadfile()
+    def load(self, filething, ID3=None, **kwargs):
+        # see __init__ for docs
+
+        fileobj = filething.fileobj
+
+        if ID3 is None:
+            ID3 = self.ID3
+        else:
+            # If this was initialized with EasyID3, remember that for
+            # when tags are auto-instantiated in add_tags.
+            self.ID3 = ID3
+
+        try:
+            self.tags = ID3(fileobj, **kwargs)
+        except ID3NoHeaderError:
+            self.tags = None
+
+        if self.tags is not None:
+            try:
+                offset = self.tags.size
+            except AttributeError:
+                offset = None
+        else:
+            offset = None
+
+        self.info = self._Info(fileobj, offset)
@@ -0,0 +1,176 @@
+# -*- coding: utf-8 -*-
+# Copyright (C) 2005  Michael Urman
+#               2006  Lukas Lalinsky
+#               2013  Christoph Reiter
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+
+import errno
+from struct import error as StructError, unpack
+
+from mutagen._util import chr_, text_type
+
+from ._frames import TCON, TRCK, COMM, TDRC, TALB, TPE1, TIT2
+
+
+def find_id3v1(fileobj):
+    """Returns a tuple of (id3tag, offset_to_end) or (None, 0)
+
+    offset mainly because we used to write too short tags in some cases and
+    we need the offset to delete them.
+    """
+
+    # id3v1 is always at the end (after apev2)
+
+    extra_read = b"APETAGEX".index(b"TAG")
+
+    try:
+        fileobj.seek(-128 - extra_read, 2)
+    except IOError as e:
+        if e.errno == errno.EINVAL:
+            # If the file is too small, might be ok since we wrote too small
+            # tags at some point. let's see how the parsing goes..
+            fileobj.seek(0, 0)
+        else:
+            raise
+
+    data = fileobj.read(128 + extra_read)
+    try:
+        idx = data.index(b"TAG")
+    except ValueError:
+        return (None, 0)
+    else:
+        # FIXME: make use of the apev2 parser here
+        # if TAG is part of APETAGEX assume this is an APEv2 tag
+        try:
+            ape_idx = data.index(b"APETAGEX")
+        except ValueError:
+            pass
+        else:
+            if idx == ape_idx + extra_read:
+                return (None, 0)
+
+        tag = ParseID3v1(data[idx:])
+        if tag is None:
+            return (None, 0)
+
+        offset = idx - len(data)
+        return (tag, offset)
+
+
+# ID3v1.1 support.
+def ParseID3v1(data):
+    """Parse an ID3v1 tag, returning a list of ID3v2.4 frames.
+
+    Returns a {frame_name: frame} dict or None.
+    """
+
+    try:
+        data = data[data.index(b"TAG"):]
+    except ValueError:
+        return None
+    if 128 < len(data) or len(data) < 124:
+        return None
+
+    # Issue #69 - Previous versions of Mutagen, when encountering
+    # out-of-spec TDRC and TYER frames of less than four characters,
+    # wrote only the characters available - e.g. "1" or "" - into the
+    # year field. To parse those, reduce the size of the year field.
+    # Amazingly, "0s" works as a struct format string.
+    unpack_fmt = "3s30s30s30s%ds29sBB" % (len(data) - 124)
+
+    try:
+        tag, title, artist, album, year, comment, track, genre = unpack(
+            unpack_fmt, data)
+    except StructError:
+        return None
+
+    if tag != b"TAG":
+        return None
+
+    def fix(data):
+        return data.split(b"\x00")[0].strip().decode('latin1')
+
+    title, artist, album, year, comment = map(
+        fix, [title, artist, album, year, comment])
+
+    frames = {}
+    if title:
+        frames["TIT2"] = TIT2(encoding=0, text=title)
+    if artist:
+        frames["TPE1"] = TPE1(encoding=0, text=[artist])
+    if album:
+        frames["TALB"] = TALB(encoding=0, text=album)
+    if year:
+        frames["TDRC"] = TDRC(encoding=0, text=year)
+    if comment:
+        frames["COMM"] = COMM(
+            encoding=0, lang="eng", desc="ID3v1 Comment", text=comment)
+    # Don't read a track number if it looks like the comment was
+    # padded with spaces instead of nulls (thanks, WinAmp).
+    if track and ((track != 32) or (data[-3] == b'\x00'[0])):
+        frames["TRCK"] = TRCK(encoding=0, text=str(track))
+    if genre != 255:
+        frames["TCON"] = TCON(encoding=0, text=str(genre))
+    return frames
+
+
+def MakeID3v1(id3):
+    """Return an ID3v1.1 tag string from a dict of ID3v2.4 frames."""
+
+    v1 = {}
+
+    for v2id, name in {"TIT2": "title", "TPE1": "artist",
+                       "TALB": "album"}.items():
+        if v2id in id3:
+            text = id3[v2id].text[0].encode('latin1', 'replace')[:30]
+        else:
+            text = b""
+        v1[name] = text + (b"\x00" * (30 - len(text)))
+
+    if "COMM" in id3:
+        cmnt = id3["COMM"].text[0].encode('latin1', 'replace')[:28]
+    else:
+        cmnt = b""
+    v1["comment"] = cmnt + (b"\x00" * (29 - len(cmnt)))
+
+    if "TRCK" in id3:
+        try:
+            v1["track"] = chr_(+id3["TRCK"])
+        except ValueError:
+            v1["track"] = b"\x00"
+    else:
+        v1["track"] = b"\x00"
+
+    if "TCON" in id3:
+        try:
+            genre = id3["TCON"].genres[0]
+        except IndexError:
+            pass
+        else:
+            if genre in TCON.GENRES:
+                v1["genre"] = chr_(TCON.GENRES.index(genre))
+    if "genre" not in v1:
+        v1["genre"] = b"\xff"
+
+    if "TDRC" in id3:
+        year = text_type(id3["TDRC"]).encode('ascii')
+    elif "TYER" in id3:
+        year = text_type(id3["TYER"]).encode('ascii')
+    else:
+        year = b""
+    v1["year"] = (year + b"\x00\x00\x00\x00")[:4]
+
+    return (
+        b"TAG" +
+        v1["title"] +
+        v1["artist"] +
+        v1["album"] +
+        v1["year"] +
+        v1["comment"] +
+        v1["track"] +
+        v1["genre"]
+    )
--- a/Show More
+++ b/Show More
				`@@ -0,0 +1 @@`
				`Don't change things here, this is a copy of https://github.com/lazka/senf`