Source code for mosqito.sq_metrics.speech_intelligibility.sii_ansi.sii_ansi

# -*- coding: utf-8 -*-

from numpy import array, zeros

from mosqito.sq_metrics.speech_intelligibility.sii_ansi._band_procedure_data import (
    _get_critical_band_data,
    _get_equal_critical_band_data,
    _get_octave_band_data,
    _get_third_octave_band_data,
)
from mosqito.sq_metrics.speech_intelligibility.sii_ansi._speech_data import (
    _get_critical_band_speech_data,
    _get_equal_critical_band_speech_data,
    _get_octave_band_speech_data,
    _get_third_octave_band_speech_data,
)
from mosqito.sq_metrics.speech_intelligibility.sii_ansi._main_sii import _main_sii
from mosqito.sound_level_meter.comp_spectrum import comp_spectrum
from mosqito.sound_level_meter.freq_band_synthesis import freq_band_synthesis


def sii_ansi(noise, fs, method, speech_level, threshold=None):
    """Calculate speech intelligibility index

    This function computes SII values for a noise time signal according to
    ANSI S3.5 standard.

    Parameters
    ----------
    noise : array_like
        Noise time signal in [Pa].
    fs: float
        Sampling frequency of the input noise signal.
    method: {"critical", "equally_critical", "third_octave", "octave"}
        Type of frequency band to be used for the calculation.
        See § 3.4 of the standard.
    speech_level : {'normal', 'raised', 'loud', 'shout'}
        Speech level to assess, the corresponding speech spectrum defined in
        the standard is used for calculation.
    threshold : array_like or 'zwicker'
        Threshold of hearing [dB ref. 2e-5 Pa] with same size as the chosen
        method frequency axis, or 'zwicker' to use the standard threshold.
        Default to None sets the threshold to zeros on each frequency band.

    Returns
    -------
    sii: numpy.ndarray
        Overall SII value.
    specific_sii: numpy.ndarray
        Specific SII values along the frequency axis.
    freq_axis: numpy.ndarray
        Frequency axis corresponding to the chosen method.

    Raises
    ------
    ValueError
        If `method` or `speech_level` is not one of the accepted values
        listed above.

    See also
    --------
    .sii_ansi_level : Speech intelligibility with an overall SPL level as background noise
    .sii_ansi_freq : Speech intelligibility with a frequency spectrum as background noise

    Notes
    -----
    The Speech Intelligibility Index :math:`SII` of the signal is computed as
    the sum of the speech-to-noise ratio :math:`A` weighted by an importance
    function :math:`I`, over the :math:`n` frequency bands.

    .. math::
        SII=\\sum_{i=1}^{n}A_{i}I_{i}

    The number of frequency bands considered depends on the chosen method:

    * "critical": 21 critical bands corresponding to the Bark scale
    * "equally_critical": 17 equally contributing critical bands
    * "third_octave": 18 third-octave bands
    * "octave": 6 octave bands

    References
    ----------
    :cite:empty:`SII-ANSI.S3.5:2017`

    .. bibliography::
        :keyprefix: SII-

    Examples
    --------
    .. plot::
       :include-source:

       >>> from mosqito.sq_metrics.speech_intelligibility import sii_ansi
       >>> import matplotlib.pyplot as plt
       >>> import numpy as np
       >>> fs=48000
       >>> d=0.2
       >>> dB=90
       >>> time = np.arange(0, d, 1/fs)
       >>> f = 50
       >>> stimulus = np.sin(2 * np.pi * f * time) * np.sin(np.pi * f * time) + np.sin(10 * np.pi * f * time) + np.sin(100 * np.pi * f * time)
       >>> rms = np.sqrt(np.mean(np.power(stimulus, 2)))
       >>> ampl = 0.00002 * np.power(10, dB / 20) / rms
       >>> stimulus = stimulus * ampl
       >>> SII, SII_spec, freq_axis = sii_ansi(stimulus, fs, method='critical', speech_level='normal')
       >>> plt.plot(freq_axis, SII_spec)
       >>> plt.xlabel("Frequency [Hz]")
       >>> plt.ylabel("Specific value ")
       >>> plt.title("Speech Intelligibility Index = " + f"{SII:.2f}")
    """
    # Reject unsupported selectors up front, before any spectrum is computed.
    if method not in ("critical", "equally_critical", "third_octave", "octave"):
        raise ValueError(
            'Method should be within {"critical", "equally_critical", "third_octave", "octave"}.'
        )
    if speech_level not in ("normal", "raised", "loud", "shout"):
        raise ValueError(
            'Speech level should be within {"normal", "raised", "loud", "shout"} to use the corresponding standard data.'
        )

    # Each method maps to (speech spectrum getter, band definition getter).
    band_procedures = {
        "critical": (
            _get_critical_band_speech_data,
            _get_critical_band_data,
        ),
        "equally_critical": (
            _get_equal_critical_band_speech_data,
            _get_equal_critical_band_data,
        ),
        "third_octave": (
            _get_third_octave_band_speech_data,
            _get_third_octave_band_data,
        ),
        "octave": (
            _get_octave_band_speech_data,
            _get_octave_band_data,
        ),
    }
    get_speech_data, get_band_data = band_procedures[method]

    # Get standard speech spectrum. The getter returns a second value that
    # this function does not need; it is discarded rather than rebinding the
    # `speech_level` argument.
    speech_spectrum, _ = get_speech_data(speech_level)

    # The band getters return center, lower and upper frequencies first,
    # followed by a method-dependent number of extra entries; only the band
    # edges are needed to synthesize the noise spectrum.
    _, lower_frequencies, upper_frequencies, *_ = get_band_data()

    # Compute noise spectrum in dB, then integrate it over the method's bands
    spec, freqs = comp_spectrum(noise, fs, nfft="default", window="blackman", db=True)
    noise_spectrum, _ = freq_band_synthesis(
        spec, freqs, lower_frequencies, upper_frequencies
    )

    SII, SII_specific, freq_axis = _main_sii(
        method, speech_spectrum, noise_spectrum, threshold
    )

    return SII, SII_specific, freq_axis