Source code for muspy.metrics.metrics

"""Evaluation metrics."""
import math

import numpy as np
from numpy import ndarray

from ..music import Music


def n_pitches_used(music: Music) -> int:
    """Return the number of unique pitches used.

    Drum tracks are ignored.

    Parameters
    ----------
    music : :class:`muspy.Music`
        Music object to evaluate.

    Returns
    -------
    int
        Number of unique pitches used.

    See Also
    --------
    :func:`muspy.n_pitch_classes_used` :
        Compute the number of unique pitch classes used.

    """
    count = 0
    is_used = [False] * 128
    for track in music.tracks:
        if track.is_drum:
            continue
        for note in track.notes:
            if not is_used[note.pitch]:
                is_used[note.pitch] = True
                count += 1
    return count


def n_pitch_classes_used(music: Music) -> int:
    """Return the number of unique pitch classes used.

    Drum tracks are ignored.

    Parameters
    ----------
    music : :class:`muspy.Music`
        Music object to evaluate.

    Returns
    -------
    int
        Number of unique pitch classes used.

    See Also
    --------
    :func:`muspy.n_pitches_used` :
        Compute the number of unique pitches used.

    """
    count = 0
    is_used = [False] * 12
    for track in music.tracks:
        if track.is_drum:
            continue
        for note in track.notes:
            pitch_class = note.pitch % 12
            if not is_used[pitch_class]:
                is_used[pitch_class] = True
                count += 1
    return count


def pitch_range(music: Music) -> int:
    """Return the pitch range.

    Drum tracks are ignored. Return zero if no note is found.

    Parameters
    ----------
    music : :class:`muspy.Music`
        Music object to evaluate.

    Returns
    -------
    int
        Pitch range.

    """
    if not music.tracks:
        return 0
    if not any(len(track.notes) > 0 for track in music.tracks):
        return 0
    highest = 0
    lowest = 127
    for track in music.tracks:
        if track.is_drum:
            continue
        for note in track.notes:
            if note.pitch > highest:
                highest = note.pitch
            if note.pitch < lowest:
                lowest = note.pitch
    return highest - lowest


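A minimal usage sketch (not part of the module source): it builds a small
Music object in memory and evaluates the three pitch metrics above. The
constructor calls and the top-level re-exports (``muspy.n_pitches_used``
and friends) are assumptions based on the public muspy API.

# --- usage sketch (not part of the module) ---
import muspy

# Three notes: C4, E4 and C5, each half a beat long at resolution 24.
notes = [
    muspy.Note(time=0, pitch=60, duration=12, velocity=64),
    muspy.Note(time=12, pitch=64, duration=12, velocity=64),
    muspy.Note(time=24, pitch=72, duration=12, velocity=64),
]
music = muspy.Music(
    resolution=24,
    tracks=[muspy.Track(program=0, is_drum=False, notes=notes)],
)
print(muspy.n_pitches_used(music))        # 3: C4, E4 and C5 are distinct pitches
print(muspy.n_pitch_classes_used(music))  # 2: C and E; C4 and C5 share a class
print(muspy.pitch_range(music))           # 12: from pitch 60 up to pitch 72

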
def empty_beat_rate(music: Music) -> float:
    r"""Return the ratio of empty beats.

    The empty-beat rate is defined as the ratio of the number of empty
    beats (where no note is played) to the total number of beats.
    Return NaN if song length is zero. This metric is also implemented
    in Pypianoroll [1].

    .. math:: empty\_beat\_rate = \frac{\#(empty\_beats)}{\#(beats)}

    Parameters
    ----------
    music : :class:`muspy.Music`
        Music object to evaluate.

    Returns
    -------
    float
        Empty-beat rate.

    See Also
    --------
    :func:`muspy.empty_measure_rate` :
        Compute the ratio of empty measures.

    References
    ----------
    1. Hao-Wen Dong, Wen-Yi Hsiao, and Yi-Hsuan Yang, "Pypianoroll: Open
       Source Python Package for Handling Multitrack Pianorolls," in
       Late-Breaking Demos of the 19th International Society for Music
       Information Retrieval Conference (ISMIR), 2018.

    """
    length = max(track.get_end_time() for track in music.tracks)
    if length < 1:
        return math.nan
    n_beats = length // music.resolution + 1
    is_empty = [True] * n_beats
    count = 0
    for track in music.tracks:
        for note in track.notes:
            start = note.time // music.resolution
            end = note.end // music.resolution
            for beat in range(start, end + 1):
                if is_empty[beat]:
                    is_empty[beat] = False
                    count += 1
    return 1 - (count / n_beats)


def empty_measure_rate(music: Music, measure_resolution: int) -> float:
    r"""Return the ratio of empty measures.

    The empty-measure rate is defined as the ratio of the number of
    empty measures (where no note is played) to the total number of
    measures. Note that this metric only works for songs with a
    constant time signature. Return NaN if song length is zero. This
    metric is used in [1].

    .. math::
        empty\_measure\_rate = \frac{\#(empty\_measures)}{\#(measures)}

    Parameters
    ----------
    music : :class:`muspy.Music`
        Music object to evaluate.
    measure_resolution : int
        Time steps per measure.

    Returns
    -------
    float
        Empty-measure rate.

    See Also
    --------
    :func:`muspy.empty_beat_rate` :
        Compute the ratio of empty beats.

    References
    ----------
    1. Hao-Wen Dong, Wen-Yi Hsiao, Li-Chia Yang, and Yi-Hsuan Yang,
       "MuseGAN: Multi-track sequential generative adversarial networks
       for symbolic music generation and accompaniment," in Proceedings
       of the 32nd AAAI Conference on Artificial Intelligence (AAAI),
       2018.

    """
    length = max(track.get_end_time() for track in music.tracks)
    if length < 1:
        return math.nan
    n_measures = length // measure_resolution + 1
    is_empty = [True] * n_measures
    count = 0
    for track in music.tracks:
        for note in track.notes:
            start = note.time // measure_resolution
            end = note.end // measure_resolution
            for measure in range(start, end + 1):
                if is_empty[measure]:
                    is_empty[measure] = False
                    count += 1
    return 1 - (count / n_measures)


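A usage sketch for the two emptiness metrics, not part of the module
source. It assumes a 4/4 song, so one measure spans ``4 * music.resolution``
time steps, which is the ``measure_resolution`` to pass.

# --- usage sketch (not part of the module) ---
import muspy

resolution = 24
notes = [
    muspy.Note(time=0, pitch=60, duration=12, velocity=64),               # on beat 1
    muspy.Note(time=3 * resolution, pitch=62, duration=12, velocity=64),  # on beat 4
]
music = muspy.Music(
    resolution=resolution,
    tracks=[muspy.Track(program=0, is_drum=False, notes=notes)],
)
print(muspy.empty_beat_rate(music))  # 0.5: beats 2 and 3 of the four counted beats are empty
print(muspy.empty_measure_rate(music, measure_resolution=4 * resolution))  # 0.0: the single measure has notes

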
def _get_pianoroll(music: Music) -> ndarray:
    """Return the binary pianoroll matrix."""
    length = max(track.get_end_time() for track in music.tracks)
    pianoroll = np.zeros((length, 128), bool)
    for track in music.tracks:
        if track.is_drum:
            continue
        for note in track.notes:
            pianoroll[note.time : note.end, note.pitch] = 1
    return pianoroll


def polyphony(music: Music) -> float:
    r"""Return the average number of pitches being played concurrently.

    The polyphony is defined as the average number of pitches being
    played at the same time, evaluated only at time steps where at
    least one pitch is on. Drum tracks are ignored. Return NaN if no
    note is found.

    .. math::
        polyphony = \frac{
            \#(pitches\_when\_at\_least\_one\_pitch\_is\_on)
        }{
            \#(time\_steps\_where\_at\_least\_one\_pitch\_is\_on)
        }

    Parameters
    ----------
    music : :class:`muspy.Music`
        Music object to evaluate.

    Returns
    -------
    float
        Polyphony.

    See Also
    --------
    :func:`muspy.polyphony_rate` :
        Compute the ratio of time steps where multiple pitches are on.

    """
    pianoroll = _get_pianoroll(music)
    denominator = np.count_nonzero(pianoroll.sum(1) > 0)
    if denominator < 1:
        return math.nan
    return pianoroll.sum() / denominator


def polyphony_rate(music: Music, threshold: int = 2) -> float:
    r"""Return the ratio of time steps where multiple pitches are on.

    The polyphony rate is defined as the ratio of the number of time
    steps where multiple pitches are on to the total number of time
    steps. Drum tracks are ignored. Return NaN if song length is zero.
    This metric is used in [1], where it is called `polyphonicity`.

    .. math::
        polyphony\_rate = \frac{
            \#(time\_steps\_where\_multiple\_pitches\_are\_on)
        }{
            \#(time\_steps)
        }

    Parameters
    ----------
    music : :class:`muspy.Music`
        Music object to evaluate.
    threshold : int, default: 2
        Threshold on the number of concurrent pitches for a time step
        to count toward the numerator.

    Returns
    -------
    float
        Polyphony rate.

    See Also
    --------
    :func:`muspy.polyphony` :
        Compute the average number of pitches being played at the same
        time.

    References
    ----------
    1. Hao-Wen Dong, Wen-Yi Hsiao, Li-Chia Yang, and Yi-Hsuan Yang,
       "MuseGAN: Multi-track sequential generative adversarial networks
       for symbolic music generation and accompaniment," in Proceedings
       of the 32nd AAAI Conference on Artificial Intelligence (AAAI),
       2018.

    """
    pianoroll = _get_pianoroll(music)
    if len(pianoroll) < 1:
        return math.nan
    return np.count_nonzero(pianoroll.sum(1) > threshold) / len(pianoroll)


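A usage sketch for the two polyphony metrics, not part of the module
source; the in-memory Music construction is an assumption based on the
standard muspy API.

# --- usage sketch (not part of the module) ---
import muspy

# A three-note chord for the first half beat, then a single sustained note.
notes = [
    muspy.Note(time=0, pitch=60, duration=24, velocity=64),
    muspy.Note(time=0, pitch=64, duration=12, velocity=64),
    muspy.Note(time=0, pitch=67, duration=12, velocity=64),
]
music = muspy.Music(
    resolution=24,
    tracks=[muspy.Track(program=0, is_drum=False, notes=notes)],
)
print(muspy.polyphony(music))       # 2.0: 48 active pianoroll cells over 24 active time steps
print(muspy.polyphony_rate(music))  # 0.5: the chord sounds during 12 of the 24 time steps

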
def _get_scale(root: int, mode: str) -> ndarray:
    """Return the scale mask for a specific root."""
    if mode == "major":
        c_scale = np.array([1, 0, 1, 0, 1, 1, 0, 1, 0, 1, 0, 1], bool)
    elif mode == "minor":
        c_scale = np.array([1, 0, 1, 1, 0, 1, 0, 1, 1, 0, 1, 0], bool)
    else:
        raise ValueError("`mode` must be either 'major' or 'minor'.")
    return np.roll(c_scale, root)


def pitch_in_scale_rate(music: Music, root: int, mode: str) -> float:
    r"""Return the ratio of pitches in a certain musical scale.

    The pitch-in-scale rate is defined as the ratio of the number of
    notes in a certain scale to the total number of notes. Drum tracks
    are ignored. Return NaN if no note is found. This metric is used in
    [1].

    .. math::
        pitch\_in\_scale\_rate = \frac{\#(notes\_in\_scale)}{\#(notes)}

    Parameters
    ----------
    music : :class:`muspy.Music`
        Music object to evaluate.
    root : int
        Root of the scale.
    mode : str, {'major', 'minor'}
        Mode of the scale.

    Returns
    -------
    float
        Pitch-in-scale rate.

    See Also
    --------
    :func:`muspy.scale_consistency` :
        Compute the largest pitch-in-scale rate.

    References
    ----------
    1. Hao-Wen Dong, Wen-Yi Hsiao, Li-Chia Yang, and Yi-Hsuan Yang,
       "MuseGAN: Multi-track sequential generative adversarial networks
       for symbolic music generation and accompaniment," in Proceedings
       of the 32nd AAAI Conference on Artificial Intelligence (AAAI),
       2018.

    """
    scale = _get_scale(root, mode.lower())
    note_count = 0
    in_scale_count = 0
    for track in music.tracks:
        if track.is_drum:
            continue
        for note in track.notes:
            note_count += 1
            if scale[note.pitch % 12]:
                in_scale_count += 1
    if note_count < 1:
        return math.nan
    return in_scale_count / note_count


def scale_consistency(music: Music) -> float:
    r"""Return the largest pitch-in-scale rate.

    The scale consistency is defined as the largest pitch-in-scale rate
    over all major and minor scales. Drum tracks are ignored. Return
    NaN if no note is found. This metric is used in [1].

    .. math::
        scale\_consistency = \max_{root, mode}{
            pitch\_in\_scale\_rate(root, mode)}

    Parameters
    ----------
    music : :class:`muspy.Music`
        Music object to evaluate.

    Returns
    -------
    float
        Scale consistency.

    See Also
    --------
    :func:`muspy.pitch_in_scale_rate` :
        Compute the ratio of pitches in a certain musical scale.

    References
    ----------
    1. Olof Mogren, "C-RNN-GAN: Continuous recurrent neural networks
       with adversarial training," in NeurIPS Workshop on Constructive
       Machine Learning, 2016.

    """
    max_in_scale_rate = 0.0
    for mode in ("major", "minor"):
        for root in range(12):
            rate = pitch_in_scale_rate(music, root, mode)
            if math.isnan(rate):
                return math.nan
            if rate > max_in_scale_rate:
                max_in_scale_rate = rate
    return max_in_scale_rate


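A usage sketch for the scale metrics, not part of the module source;
the in-memory construction is an assumption based on the standard muspy
API. Notes drawn entirely from C major yield a rate of 1.0 for that
scale, and hence a scale consistency of 1.0.

# --- usage sketch (not part of the module) ---
import muspy

# An ascending C major scale, one note every half beat.
notes = [
    muspy.Note(time=i * 12, pitch=p, duration=12, velocity=64)
    for i, p in enumerate([60, 62, 64, 65, 67, 69, 71, 72])
]
music = muspy.Music(
    resolution=24,
    tracks=[muspy.Track(program=0, is_drum=False, notes=notes)],
)
print(muspy.pitch_in_scale_rate(music, root=0, mode="major"))  # 1.0: every note is in C major
print(muspy.scale_consistency(music))                          # 1.0: the best-fitting scale is a perfect fit

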
def _get_drum_pattern(res: int, meter: str) -> ndarray:
    """Return the drum pattern mask of a specific meter."""
    drum_pattern = np.zeros(res, dtype=bool)
    drum_pattern[0] = 1
    if meter == "duple":
        if res % 4 == 0:
            drum_pattern[:: (res // 4)] = 1
        if res % 2 == 0:
            drum_pattern[:: (res // 2)] = 1
    elif meter == "triple":
        if res % 3 == 0:
            drum_pattern[:: (res // 3)] = 1
    else:
        raise ValueError("Only duple and triple meters are supported.")
    return drum_pattern


def drum_in_pattern_rate(music: Music, meter: str) -> float:
    r"""Return the ratio of drum notes in a certain drum pattern.

    The drum-in-pattern rate is defined as the ratio of the number of
    drum notes in a certain drum pattern to the total number of drum
    notes. Only drum tracks are considered. Return NaN if no drum note
    is found. This metric is used in [1].

    .. math::
        drum\_in\_pattern\_rate = \frac{
            \#(drum\_notes\_in\_pattern)}{\#(drum\_notes)}

    Parameters
    ----------
    music : :class:`muspy.Music`
        Music object to evaluate.
    meter : str, {'duple', 'triple'}
        Meter of the drum pattern.

    Returns
    -------
    float
        Drum-in-pattern rate.

    See Also
    --------
    :func:`muspy.drum_pattern_consistency` :
        Compute the largest drum-in-pattern rate.

    References
    ----------
    1. Hao-Wen Dong, Wen-Yi Hsiao, Li-Chia Yang, and Yi-Hsuan Yang,
       "MuseGAN: Multi-track sequential generative adversarial networks
       for symbolic music generation and accompaniment," in Proceedings
       of the 32nd AAAI Conference on Artificial Intelligence (AAAI),
       2018.

    """
    drum_pattern = _get_drum_pattern(music.resolution, meter.lower())
    note_count = 0
    in_pattern_count = 0
    for track in music.tracks:
        if not track.is_drum:
            continue
        for note in track.notes:
            note_count += 1
            if drum_pattern[note.time % music.resolution]:
                in_pattern_count += 1
    if note_count < 1:
        return math.nan
    return in_pattern_count / note_count


def drum_pattern_consistency(music: Music) -> float:
    r"""Return the largest drum-in-pattern rate.

    The drum pattern consistency is defined as the largest
    drum-in-pattern rate over duple and triple meters. Only drum tracks
    are considered. Return NaN if no drum note is found.

    .. math::
        drum\_pattern\_consistency = \max_{meter}{
            drum\_in\_pattern\_rate(meter)}

    Parameters
    ----------
    music : :class:`muspy.Music`
        Music object to evaluate.

    Returns
    -------
    float
        Drum pattern consistency.

    See Also
    --------
    :func:`muspy.drum_in_pattern_rate` :
        Compute the ratio of drum notes in a certain drum pattern.

    """
    drum_in_duple_pattern_rate = drum_in_pattern_rate(music, "duple")
    if math.isnan(drum_in_duple_pattern_rate):
        return math.nan
    drum_in_triple_pattern_rate = drum_in_pattern_rate(music, "triple")
    if drum_in_duple_pattern_rate > drum_in_triple_pattern_rate:
        return drum_in_duple_pattern_rate
    return drum_in_triple_pattern_rate


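A usage sketch for the drum metrics, not part of the module source; the
track contents are an assumption for illustration (pitch 36 stands in
for a kick drum in the General MIDI percussion map).

# --- usage sketch (not part of the module) ---
import muspy

resolution = 24
# Drum hits on every half beat over four beats: a straight duple feel.
notes = [
    muspy.Note(time=t, pitch=36, duration=1, velocity=64)
    for t in range(0, 4 * resolution, resolution // 2)
]
music = muspy.Music(
    resolution=resolution,
    tracks=[muspy.Track(program=0, is_drum=True, notes=notes)],
)
print(muspy.drum_in_pattern_rate(music, meter="duple"))  # 1.0: every hit lands on the duple grid
print(muspy.drum_pattern_consistency(music))             # 1.0: the duple rate is the larger of the two

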
def _entropy(prob):
    """Return the Shannon entropy (in bits) of a probability vector."""
    with np.errstate(divide="ignore", invalid="ignore"):
        return -np.nansum(prob * np.log2(prob))


def pitch_entropy(music: Music) -> float:
    r"""Return the entropy of the normalized note pitch histogram.

    The pitch entropy is defined as the Shannon entropy of the
    normalized note pitch histogram. Drum tracks are ignored. Return
    NaN if no note is found.

    .. math::
        pitch\_entropy = -\sum_{i = 0}^{127}{
            P(pitch=i) \log_2 P(pitch=i)}

    Parameters
    ----------
    music : :class:`muspy.Music`
        Music object to evaluate.

    Returns
    -------
    float
        Pitch entropy.

    See Also
    --------
    :func:`muspy.pitch_class_entropy` :
        Compute the entropy of the normalized pitch class histogram.

    """
    counter = np.zeros(128)
    for track in music.tracks:
        if track.is_drum:
            continue
        for note in track.notes:
            counter[note.pitch] += 1
    denominator = counter.sum()
    if denominator < 1:
        return math.nan
    prob = counter / denominator
    return _entropy(prob)


def pitch_class_entropy(music: Music) -> float:
    r"""Return the entropy of the normalized note pitch class histogram.

    The pitch class entropy is defined as the Shannon entropy of the
    normalized note pitch class histogram. Drum tracks are ignored.
    Return NaN if no note is found. This metric is used in [1].

    .. math::
        pitch\_class\_entropy = -\sum_{i = 0}^{11}{
            P(pitch\_class=i) \times \log_2 P(pitch\_class=i)}

    Parameters
    ----------
    music : :class:`muspy.Music`
        Music object to evaluate.

    Returns
    -------
    float
        Pitch class entropy.

    See Also
    --------
    :func:`muspy.pitch_entropy` :
        Compute the entropy of the normalized pitch histogram.

    References
    ----------
    1. Shih-Lun Wu and Yi-Hsuan Yang, "The Jazz Transformer on the
       Front Line: Exploring the Shortcomings of AI-composed Music
       through Quantitative Measures," in Proceedings of the 21st
       International Society for Music Information Retrieval Conference
       (ISMIR), 2020.

    """
    counter = np.zeros(12)
    for track in music.tracks:
        if track.is_drum:
            continue
        for note in track.notes:
            counter[note.pitch % 12] += 1
    denominator = counter.sum()
    if denominator < 1:
        return math.nan
    prob = counter / denominator
    return _entropy(prob)


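A usage sketch for the entropy metrics, not part of the module source;
the in-memory construction is an assumption based on the standard muspy
API. Two pitches used equally often give exactly one bit of entropy.

# --- usage sketch (not part of the module) ---
import muspy

notes = [
    muspy.Note(time=0, pitch=60, duration=12, velocity=64),   # C4
    muspy.Note(time=12, pitch=67, duration=12, velocity=64),  # G4
]
music = muspy.Music(
    resolution=24,
    tracks=[muspy.Track(program=0, is_drum=False, notes=notes)],
)
print(muspy.pitch_entropy(music))        # 1.0: two equally likely pitches
print(muspy.pitch_class_entropy(music))  # 1.0: two equally likely pitch classes

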
def groove_consistency(music: Music, measure_resolution: int) -> float:
    r"""Return the groove consistency.

    The groove consistency is defined as one minus the mean hamming
    distance between the onset vectors of neighboring measures.

    .. math::
        groove\_consistency = 1 - \frac{1}{T - 1} \sum_{i = 1}^{T - 1}{
            d(G_i, G_{i + 1})}

    Here, :math:`T` is the number of measures, :math:`G_i` is the
    binary onset vector of the :math:`i`-th measure (a one at each
    position that has an onset, otherwise a zero), and :math:`d(G, G')`
    is the hamming distance between two vectors :math:`G` and
    :math:`G'`. Note that this metric only works for songs with a
    constant time signature. Return NaN if the number of measures is
    less than two. This metric is used in [1].

    Parameters
    ----------
    music : :class:`muspy.Music`
        Music object to evaluate.
    measure_resolution : int
        Time steps per measure.

    Returns
    -------
    float
        Groove consistency.

    References
    ----------
    1. Shih-Lun Wu and Yi-Hsuan Yang, "The Jazz Transformer on the
       Front Line: Exploring the Shortcomings of AI-composed Music
       through Quantitative Measures," in Proceedings of the 21st
       International Society for Music Information Retrieval Conference
       (ISMIR), 2020.

    """
    length = max(track.get_end_time() for track in music.tracks)
    if measure_resolution < 1:
        raise ValueError("Measure resolution must be a positive integer.")
    n_measures = (length // measure_resolution) + 1
    if n_measures < 2:
        return math.nan
    groove_patterns = np.zeros((n_measures, measure_resolution), bool)
    for track in music.tracks:
        for note in track.notes:
            measure, position = divmod(note.time, measure_resolution)
            if not groove_patterns[measure, position]:
                groove_patterns[measure, position] = 1
    hamming_distance = np.count_nonzero(
        groove_patterns[:-1] != groove_patterns[1:]
    )
    return 1 - hamming_distance / (measure_resolution * (n_measures - 1))
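

A usage sketch for groove consistency, not part of the module source;
as above, a 4/4 measure at resolution 24 spans 96 time steps, and the
in-memory construction is an assumption based on the standard muspy
API.

# --- usage sketch (not part of the module) ---
import muspy

resolution = 24
measure_resolution = 4 * resolution  # one 4/4 measure
# A note on every beat across two measures: identical onset patterns.
notes = [
    muspy.Note(time=t, pitch=60, duration=12, velocity=64)
    for t in range(0, 2 * measure_resolution, resolution)
]
music = muspy.Music(
    resolution=resolution,
    tracks=[muspy.Track(program=0, is_drum=False, notes=notes)],
)
print(muspy.groove_consistency(music, measure_resolution))  # 1.0: neighboring measures match exactly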