Source code for lib.stream.mp3file

#!/usr/bin/env python3
# MusicDB,  a music manager with web-based UI that focuses on music.
# Copyright (C) 2018  Ralf Stemmer <ralf.stemmer@gmx.net>
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program.  If not, see <http://www.gnu.org/licenses/>.
"""
This module provides a class to read mp3 files frame by frame.
Decoding the audio data is not part of it.
"""
import sys

# Lookup tables for decoding the 4 byte MP3 Frame Header.
# ``None`` marks codes that are reserved or invalid.

# Bit rates in kbit/s.
# 1st index: 0 = MPEG-2 and MPEG-2.5, 1 = MPEG-1
# 2nd index: layer number - 1
# 3rd index: 4 bit bit-rate code from the header (0 = free format, 15 = invalid)
BitrateTable = [
    # MPEG-2 & 2.5
    [
        [0, 32, 48, 56, 64, 80, 96, 112, 128, 144, 160, 176, 192, 224, 256, None],  # Layer 1
        [0, 8, 16, 24, 32, 40, 48, 56, 64, 80, 96, 112, 128, 144, 160, None],       # Layer 2
        [0, 8, 16, 24, 32, 40, 48, 56, 64, 80, 96, 112, 128, 144, 160, None],       # Layer 3
    ],
    # MPEG-1
    [
        [0, 32, 64, 96, 128, 160, 192, 224, 256, 288, 320, 352, 384, 416, 448, None],  # Layer 1
        [0, 32, 48, 56, 64, 80, 96, 112, 128, 160, 192, 224, 256, 320, 384, None],     # Layer 2
        [0, 32, 40, 48, 56, 64, 80, 96, 112, 128, 160, 192, 224, 256, 320, None],      # Layer 3
    ],
]

# Sample rates in Hz.
# 1st index: 2 bit MPEG version code, 2nd index: 2 bit sample rate code
SamplerateTable = [
    [11025, 12000, 8000, None],   # MPEG-2.5
    [None, None, None, None],     # reserved
    [22050, 24000, 16000, None],  # MPEG-2
    [44100, 48000, 32000, None],  # MPEG-1
]

# Samples per frame.
# 1st index: 2 bit MPEG version code, 2nd index: layer number - 1
FrameSamplesTable = [
    [384, 1152, 576, None],    # MPEG-2.5
    [None, None, None, None],  # reserved
    [384, 1152, 576, None],    # MPEG-2
    [384, 1152, 1152, None],   # MPEG-1
]

# Channel mode, indexed by the 2 bit mode code
ModeTable = ["stereo", "joint stereo", "dual channel", "mono"]

# Mode extension.
# 1st index: layer number - 1, 2nd index: 2 bit mode extension code
ModeExtensionTable = [
    ["4-31", "8-31", "12-31", "16-31"],  # Layer 1
    ["4-31", "8-31", "12-31", "16-31"],  # Layer 2
    ["", "IS", "MS", "IS+MS"],           # Layer 3
]

# Emphasis, indexed by the 2 bit emphasis code
EmphaseTable = ["none", "50/15 ms", "reserved", "CCIT J.17"]

# Size of one padding slot in bytes, indexed by layer number - 1
SlotsizeTable = [4, 1, 1, None]


class MP3File(object):
    """
    This class allows frame wise reading of an mp3 file.
    This is done by the :meth:`~Frames` generator.
    Beside the mp3 frames the generator returns lots of information extracted from the mp3 Frame Header.

    The class expects a valid mp3 file (MPEG Layer III) with a valid ID3 Tag (ID3v2.3.0 or ID3v2.4.0).

    Args:
        path (str):
            An absolute path to a valid mp3 file.
            When the path is empty or ``None``, no file gets loaded.
            :meth:`~Load` can then be called later.

    Example:

        .. code-block:: python

            # ffmpeg -filter_complex aevalsrc=0 -acodec libmp3lame -ab 320k -t 1 silence.mp3

            mp3file = MP3File("./silence.mp3")
            for frame in mp3file.Frames():
                print("=== %5i / %5i ==="%(frame["count"], frame["total"]))
                print(frame["header"])
    """

    def __init__(self, path):
        self.id3tag = None  # raw bytes of the ID3 Tag, including its 10 byte header
        self.frames = []    # one dictionary per MP3 Frame, filled by Load
        self.path   = None  # path of the currently loaded file

        if path:
            self.Load(path)



    def Load(self, path):
        r"""
        This method loads a new mp3 file.
        All information from the previous file will be discarded.

        The method reads the whole file, analyzes each frame, and stores them in memory.
        The ID3 Tag gets also read, but not further processed.

        The following diagram shows how this method loads and processes the mp3 file:

        .. graphviz::

            digraph hierarchy {
                size="5,8"
                start           [label="Start"];

                readid3header   [shape=box,     label="Read ID3 Header"]
                decodeid3size   [shape=box,     label="Decode the length\nof the ID3 Tag"]
                readid3tag      [shape=box,     label="Read ID3 Tag"]

                readmp3header   [shape=box,     label="Read MP3 Frame Header"]
                analyzeheader   [shape=box,     label="Analyze MP3 Frame Header"]
                readmp3frame    [shape=box,     label="Read MP3 Frame"]
                savemp3frame    [shape=box,     label="Store MP3 Frame\nin internal list"]

                end             [label="End"];

                start           -> readid3header
                readid3header   -> decodeid3size
                decodeid3size   -> readid3tag
                readid3tag      -> readmp3header

                readmp3header   -> analyzeheader
                analyzeheader   -> readmp3frame
                readmp3frame    -> savemp3frame
                savemp3frame    -> readmp3header

                readmp3header   -> end              [label="No further data"]
            }


        Args:
            path (str): An absolute path to a valid mp3 file

        Returns:
            *Nothing*

        Raises:
            ValueError: When there is unexpected or invalid information in the given file.
                This includes a missing or incomplete ID3 Header, an incomplete or unexpected
                MP3 Frame Header, and frames whose size cannot be determined (free format bit rate).
        """
        # a normal and valid ID3 Tag is expected! - there MUST be a Tag!
        # same with mp3 files - this method is made for the cached mp3 files!

        self.path   = path
        self.id3tag = None
        self.frames = []
        with open(self.path, "rb") as mp3:

            # first, read the ID3 tag
            id3header = mp3.read(10)
            if not id3header:
                raise ValueError("Failed reading the first 10 bytes if the ID3Tag (the ID3 Header)")

            if id3header[:3] != b"ID3":
                raise ValueError("ID3Tag expected but missing. First three bytes of the file should be \"ID3\", not \"%s\""%(str(id3header[:3])))

            # Without this check a truncated header leads to an IndexError when decoding the size
            if len(id3header) < 10:
                raise ValueError("Incomplete ID3 Header. 10 bytes expected, but only %i bytes available"%(len(id3header)))

            # Decode the ID3 Tag size: 4 bytes, most significant byte first, 7 bit per byte.
            # The 10 bytes of the ID3 Header are not included in that size.
            id3tagsize  = id3header[6]<<21 | id3header[7]<<14 | id3header[8]<<7 | id3header[9]
            self.id3tag = id3header + mp3.read(id3tagsize)

            # Now, read all frames
            while True:
                # read the next frame header (4 bytes)
                mp3header = mp3.read(4)
                if not mp3header:
                    break   # end of file

                if mp3header[:2] != b"\xFF\xFB":
                    raise ValueError("Expected Frame Sync Bits missing. First two bytes of the MP3 Frame Header should be \"0xFF 0xFB\", not \"%s\""%(str(mp3header[:2])))

                # A header shorter than 4 bytes would be interpreted as a wrong integer value
                if len(mp3header) < 4:
                    raise ValueError("Incomplete MP3 Frame Header. 4 bytes expected, but only %i bytes available"%(len(mp3header)))

                infos    = self.AnalyzeHeader(mp3header)
                datasize = infos["framesize"] - 4        # 4 bytes MP3 Frame Header already read, rest are MP3 Frame Data

                # A negative size would make read() return the whole rest of the file as one frame.
                # This happens for the free format bit rate code, where the frame size is unknown.
                if datasize < 0:
                    raise ValueError("Invalid frame size of %i bytes. Frames with free format bit rate are not supported"%(infos["framesize"]))

                # Store the complete frame (header + data) together with the analyzed header
                mp3frame = mp3header + mp3.read(datasize)
                frame = {}
                frame["frame"] = mp3frame
                frame["header"]= infos
                self.frames.append(frame)



    def Frames(self):
        """
        This is a generator that returns a frame from the loaded mp3 file and information about that frame.

        The returned dictionary contains the following information:

            * ``"frame"`` (bytes): A complete MP3 Frame including the Frame Header and the Frame Data
            * ``"header"`` (dict): The interpretation of the MP3 Frame Header as returned by :meth:`AnalyzeHeader`
            * ``"total"`` (int): The total number of frames in the mp3 file
            * ``"count"`` (int): The number of this frame between ``1`` and ``total``

        The yielded dictionaries are the ones stored internally.
        The keys ``"total"`` and ``"count"`` get written into them while iterating.

        Returns:
            A generator that returns a dictionary including a mp3 frame

        Example:

            .. code-block:: python

                mp3file = MP3File("./silence.mp3")
                for frame in mp3file.Frames():
                    print("=== %5i / %5i ==="%(frame["count"], frame["total"]))
                    print(frame["header"])

        """
        total = len(self.frames)

        for count, frame in enumerate(self.frames, 1):
            frame["total"] = total
            frame["count"] = count
            yield frame



    def AnalyzeHeader(self, header):
        r"""
        This method analyzes a MP3 Frame Header and returns all information that are implicit included in these 4 bytes.
        It is build for the internal use inside this class.

        Primary source for analyzing the header is `mpgedit.org (no HTTPS) <http://mpgedit.org/mpgedit/mpeg_format/MP3Format.html>`_
        Another important source is `Wikipedia <https://en.wikipedia.org/wiki/MP3#Design>`_

        Base of the implementation of this method is from `a python script from Vivake Gupta (vivake AT lab49.com) <https://www.w3.org/2000/10/swap/pim/mp3/mp3info.py>`_
        A further helpful code example comes from `SirNickity from the hydrogenaud.io community <https://hydrogenaud.io/index.php?topic=85125.msg747716#msg747716>`_

        Those codes were improved by me to get information I need.
        These information (and more) are returned as dictionary.
        The returned dictionary contains the following keys:

            * Relevant information:
                * ``"framesize"`` (int): Size of a frame in the MP3 file. This includes the 4 bytes of the MP3 Frame Header.
                * ``"frametime"`` (float): The playtime of the audio in milliseconds that is encoded in one frame
                * ``"layer"`` (int): MPEG layer. For MP3 it should be ``3``
                * ``"mpeg version"`` (int/float): MPEG version: ``1``, ``2`` or ``2.5``. For MP3, it should be ``1``
            * Further information (I have no idea what some of the information mean. They are simply not relevant anyway.):
                * ``"bitrate"`` (int): Bit rate in bit/s. ``0`` when the header uses the *free format* code
                * ``"protection"`` (bool): When ``True`` the header has a CRC16 checksum
                * ``"padding"`` (bool): When ``True`` the frame is padded with an extra slot. (The slot size is given in ``"slotsize"``)
                * ``"private"`` (bool): *free to use*
                * ``"mode"`` (str): Channel mode: ``"stereo"``, ``"joint stereo"``, ``"dual channel"`` or ``"mono"``
                * ``"modeextension"`` (str): For MPEG Layer 1 and 2: ``"4-31"``, ``"8-31"``, ``"12-31"`` or ``"16-31"``. For MPEG Layer 3: ``""`` (empty), ``"IS"``, ``"MS"`` or ``"IS+MS"``. ``"IS"`` stands for *Intensity Stereo Mode*, ``"MS"`` for *MS Stereo Mode*
                * ``"copyright"`` (bool): Copyrighted data
                * ``"original"`` (bool): Original data
                * ``"emphasis"`` (str): One of the following strings: ``"none"``, ``"50/15 ms"``, ``"reserved"`` or ``"CCIT J.17"``
                * ``"samples"`` (int): Samples per frame
                * ``"slotsize"`` (int): The size of one slot
                * ``"bitspersample"`` (float): Samples per frame divided by 8. Used as factor for calculating the frame size
                * ``"samplerate"`` (int): Samplerate

        For the *free format* bit rate code the frame size cannot be calculated from the header.
        In this case ``"framesize"`` only consists of the padding slot (if any).

        Args:
            header (int/bytes): The 4 byte MP3 Frame Header in bytes, or as integer (unsigned, big endian!)

        Returns:
            A dictionary with all information encoded in the header

        Raises:
            TypeError: When ``header`` is not of type bytes or int.
            ValueError: When there are invalid information encoded in the header.

        Example:

            .. code-block:: python

                # ...
                header = mp3.read(4)

                if header[:2] != b"\xFF\xFB":
                    raise ValueError("Expected Frame Sync Bits missing")
                try:
                    infos = self.AnalyzeHeader(header)
                except ValueError as e:
                    print("Invalid header! Problem: %s"%(str(e)))

        """
        if isinstance(header, (bytes, bytearray)):
            header = int.from_bytes(header, byteorder='big', signed=False)

        if not isinstance(header, int):
            raise TypeError("The argument must be of type bytes, or an integer! Actual type is %s"%(str(type(header))))

        # The comments relate to this article: http://mpgedit.org/mpgedit/mpeg_format/MP3Format.html
        mpeg_version =    (header >> 19) & 3  # BB   00 = MPEG2.5, 01 = res, 10 = MPEG2, 11 = MPEG1
        layer =           (header >> 17) & 3  # CC   00 = res, 01 = Layer 3, 10 = Layer 2, 11 = Layer 1
        protection_bit =  (header >> 16) & 1  # D    0 = protected, 1 = not protected
        bitrateindex =    (header >> 12) & 15 # EEEE 0000 = free, 1111 = bad
        samplerateindex = (header >> 10) & 3  # F    11 = res
        padding_bit =     (header >> 9)  & 1  # G    0 = not padded, 1 = padded
        private_bit =     (header >> 8)  & 1  # H
        mode =            (header >> 6)  & 3  # II   00 = stereo, 01 = joint stereo, 10 = dual channel, 11 = mono
        mode_extension =  (header >> 4)  & 3  # JJ
        copyright =       (header >> 3)  & 1  # K    0 = not copyrighted, 1 = copyrighted
        original =        (header >> 2)  & 1  # L    0 = copy, 1 = original
        emphasis =        (header >> 0)  & 3  # MM   00 = none, 01 = 50/15 ms, 10 = res, 11 = CCIT J.17

        infos = {}

        # Check version
        if mpeg_version == 0:
            infos["mpeg version"] = 2.5
        elif mpeg_version == 2:
            infos["mpeg version"] = 2
        elif mpeg_version == 3:
            infos["mpeg version"] = 1
        else:
            raise ValueError("Invalid MPEG version code. %i ∉ {0,2,3}"%(mpeg_version))

        # Check Layer
        if layer == 1:
            infos["layer"] = 3
        elif layer == 2:
            infos["layer"] = 2
        elif layer == 3:
            infos["layer"] = 1
        else:
            raise ValueError("Invalid MPEG layer code. %i ∉ {1,2,3}"%(layer))

        # The tables contain None for invalid codes.
        # They must be checked before doing any calculation with the values.
        bitrate = BitrateTable[mpeg_version & 1][infos["layer"] - 1][bitrateindex]
        if bitrate is None:
            raise ValueError("Invalid bit rate code %i"%(bitrateindex))

        samplerate = SamplerateTable[mpeg_version][samplerateindex]
        if samplerate is None:
            raise ValueError("Invalid sample rate code %i"%(samplerateindex))

        infos["bitrate"]        = bitrate * 1000    # table values are in kbit/s
        infos["samplerate"]     = samplerate
        infos["protection"]     = not bool(protection_bit)
        infos["padding"]        = bool(padding_bit)
        infos["private"]        = bool(private_bit)
        infos["mode"]           = ModeTable[mode]
        infos["modeextension"]  = ModeExtensionTable[infos["layer"] - 1][mode_extension]
        infos["copyright"]      = bool(copyright)
        infos["original"]       = bool(original)
        infos["emphasis"]       = EmphaseTable[emphasis]
        infos["samples"]        = FrameSamplesTable[mpeg_version][infos["layer"] - 1]
        infos["slotsize"]       = SlotsizeTable[infos["layer"] - 1]
        infos["bitspersample"]  = infos["samples"] / 8.0
        infos["framesize"]      = (infos["bitspersample"] * infos["bitrate"]) / infos["samplerate"]
        infos["frametime"]      = (infos["samples"] / infos["samplerate"]) * 1000
        if infos["padding"]:
            infos["framesize"] += infos["slotsize"]

        # Frame size must be an integer - it is the size in bytes
        infos["framesize"] = int(infos["framesize"])

        return infos



if __name__ == "__main__":
    # Manual demo: print the analyzed header of every frame of a test file,
    # each preceded by a highlighted "count / total" banner line.
    mp3file = MP3File("./test2.mp3")
    for frame in mp3file.Frames():
        position = (frame["count"], frame["total"])
        print("\033[1;35m=== %5i / %5i ===\033[0m"%position)
        print(frame["header"])


# vim: tabstop=4 expandtab shiftwidth=4 softtabstop=4