<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Acoust.</journal-id>
<journal-title>Frontiers in Acoustics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Acoust.</abbrev-journal-title>
<issn pub-type="epub">2813-8082</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1477395</article-id>
<article-id pub-id-type="doi">10.3389/facou.2024.1477395</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Acoustics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Objective quantification of sound sensory attributes in side-by-side vehicles using multiple linear regression models</article-title>
<alt-title alt-title-type="left-running-head">Benghanem et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/facou.2024.1477395">10.3389/facou.2024.1477395</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Benghanem</surname>
<given-names>Abdelghani</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2839633/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Valentin</surname>
<given-names>Olivier</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/611344/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Gauthier</surname>
<given-names>Philippe-Aubert</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Berry</surname>
<given-names>Alain</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Groupe d&#x2019;Acoustique De l&#x2019;Universit&#xe9; de Sherbrooke</institution>, <addr-line>Sherbrooke</addr-line>, <addr-line>QC</addr-line>, <country>Canada</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Centre for Interdisciplinary Research in Music Media and Technology</institution>, <institution>McGill University</institution>, <addr-line>Montr&#xe9;al</addr-line>, <addr-line>QC</addr-line>, <country>Canada</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>&#xc9;cole Des Arts Visuels Et M&#xe9;diatiques</institution>, <institution>Universit&#xe9; Du Qu&#xe9;bec &#xc0; Montr&#xe9;al</institution>, <addr-line>Montr&#xe9;al</addr-line>, <addr-line>QC</addr-line>, <country>Canada</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1364669/overview">Antonio J. Torija Martinez</ext-link>, University of Salford, United Kingdom</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2816083/overview">Zuzanna Podwinska</ext-link>, University of Salford, United Kingdom</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2081126/overview">Wenbo Duan</ext-link>, University of Hertfordshire, United Kingdom</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Olivier Valentin, <email>m.olivier.valentin@gmail.com</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>18</day>
<month>10</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>2</volume>
<elocation-id>1477395</elocation-id>
<history>
<date date-type="received">
<day>07</day>
<month>08</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>30</day>
<month>09</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Benghanem, Valentin, Gauthier and Berry.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Benghanem, Valentin, Gauthier and Berry</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>The evaluation of sound quality is a pivotal area of research within audio and acoustics. Commonly used sound quality evaluation methods include both objective and subjective approaches, the latter being time-consuming and costly as they rely on listening tests. This research work aims to investigate the use of predictive sound quality models as a way to objectively assess the <italic>Desire-to-buy</italic> of side-by-side vehicles, in a more efficient, faster, and less costly way than conventional methods. Multiple linear regression algorithms were used to validate the objective models derived from objective physical metrics and perceptual psychophysical metrics. The sensory profile objective models reported in this paper were constructed using parsimonious linear <italic>Lasso</italic> and <italic>Elastic-net</italic> algorithms. Our results show that linear objective models effectively account for each of the perceptual attributes of the sensory profiles and the <italic>Desire-to-buy</italic>, while only requiring a few physical and psychophysical metrics.</p>
</abstract>
<kwd-group>
<kwd>sound quality</kwd>
<kwd>perceptual attributes</kwd>
<kwd>lasso/elastic-net</kwd>
<kwd>sparsity</kwd>
<kwd>objective models</kwd>
<kwd>recreational vehicles</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Acoustic Materials, Noise Control and Sound Perception</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>The evaluation of sound quality is a significant area of research in audio and acoustics (<xref ref-type="bibr" rid="B17">Lyon, 2003</xref>). Traditional methods for assessing vehicle sound quality involve both subjective and objective approaches, often relying on listening tests. However, most objective sound quality models depend on a limited set of pre-selected metrics or simple linear models to predict a single attribute, such as overall sound preference or annoyance. Given the extensive array of available objective metrics, both physical and psychoacoustic, and the advancements in computational tools, there is potential to enhance the number of predictors used in these models.</p>
<p>This study builds on prior work published in Acta Acustica in 2021, exploring the use of objective sound metrics to develop models for sound quality evaluation (<xref ref-type="bibr" rid="B2">Benghanem et al., 2021</xref>). These models complement traditional subjective assessments used in engineering to evaluate vehicle sound signatures. The objective models presented in this paper are designed to benefit Noise, Vibration, and Harshness (NVH) engineers by improving the evaluation of critical sound attributes, thereby optimizing the <italic>Desire-to-buy</italic> factor in vehicle design and marketing.</p>
<p>Specifically, this paper presents models that use objective metrics to predict the sound quality and sound signature of seven recreational side-by-side vehicles (SSVs). The subjective evaluations were gathered through focus group sessions and listening tests conducted with a panel of users, assessing sensory profiles and <italic>Desire-to-buy</italic>. Additionally, the study analyzes perceptual attributes, the <italic>Desire-to-buy</italic> factor, and essential components of sensory profiles identified in previous work (<xref ref-type="bibr" rid="B2">Benghanem et al., 2021</xref>).</p>
<p>Linear regression models based on parsimonious modeling algorithms of multiple linear regression [<italic>Lasso</italic> (<xref ref-type="bibr" rid="B22">Tibshirani, 1996</xref>) and <italic>Elastic-net</italic> (<xref ref-type="bibr" rid="B29">Zou and Hastie, 2005</xref>)] were used to correlate subjective evaluations with objective physical or psychoacoustic metrics.</p>
<p>
<xref ref-type="sec" rid="s2">Section 2</xref> provides a detailed review of the thematic literature and theoretical background. <xref ref-type="sec" rid="s3">Section 3</xref> outlines the methodological aspects. Results are presented in <xref ref-type="sec" rid="s4">Section 4</xref> and discussed in <xref ref-type="sec" rid="s5">Section 5</xref>. Conclusions and future directions are discussed in <xref ref-type="sec" rid="s6">Section 6</xref>.</p>
</sec>
<sec id="s2">
<title>2 Background in sound quality evaluation and prediction</title>
<p>Within the industry, it is difficult to obtain a subjective assessment of the interior noise of a vehicle to characterize the sound comfort or other sound quality. Indeed, this is often a time-consuming and expensive task. Therefore, industry and researchers in acoustics and vibration tend to favor objective evaluations. In the field of acoustics, an objective evaluation consists of determining the characteristics of acoustic stimuli via objective metrics and physical measurements. Subsequently, these metrics can be used to predict subjective evaluation (<xref ref-type="bibr" rid="B14">Kwon et al., 2018</xref>; <xref ref-type="bibr" rid="B16">Lee, 2008</xref>).</p>
<p>Many research works have been conducted on the sound quality of vehicles, mostly for automobiles (<xref ref-type="bibr" rid="B19">Otto et al., 2001</xref>; <xref ref-type="bibr" rid="B4">Chen and Wang, 2014</xref>; <xref ref-type="bibr" rid="B13">Kim et al., 2009</xref>). To the authors&#x2019; knowledge, no similar studies have been conducted to cover SSVs, aside from the 2021 study published in Acta Acustica (<xref ref-type="bibr" rid="B2">Benghanem et al., 2021</xref>), upon which this research builds. Unlike automobiles, SSVs are all-terrain utility vehicles used for heavy-duty work, which requires a sound that conveys both a sense of power and efficiency. Therefore, the research findings obtained with automobiles are not directly transferable to SSVs.</p>
<p>In the early days of sound quality research and development, the physical metrics used for objective sound evaluation were sound power, loudness, pressure level, and frequency-weighted sound pressure levels [dB (A), dB (C), etc.]. Over time, industry and researchers found that the pressure level weights were not sufficient to fully explain the human auditory perception of products. Psychoacoustics studies (the study of the relationship between the physical properties of sound and auditory perception in humans, using the physiology of the ears and the mechanisms of sound coding by human hearing) led to the development of psychoacoustic indicators (sound metrics) in several areas of audio and music. These indicators make it possible to describe the various auditory aspects of sounds (<xref ref-type="bibr" rid="B7">Fastl and Zwicker, 2007</xref>; <xref ref-type="bibr" rid="B28">Zhekova, 2007</xref>).</p>
<p>The psychoacoustic metrics developed to assess the sound quality of vehicles are numerous; they include loudness, sharpness, roughness, fluctuation strength, pitch, and timbre. However, most of these metrics were historically introduced in an attempt to predict the annoyance of sounds and noise, not the desirability of a sound (<xref ref-type="bibr" rid="B7">Fastl and Zwicker, 2007</xref>; <xref ref-type="bibr" rid="B28">Zhekova, 2007</xref>; <xref ref-type="bibr" rid="B13">Kim et al., 2009</xref>). Thus, these usual metrics are not necessarily suitable for the research question of this study, and more suitable ones need to be found.</p>
<p>In parallel, some research endeavors have led to metrics for information extraction from music and its applications. This interdisciplinary research area is known as &#x201c;Music Information Retrieval&#x201d; (MIR) in the context of massive data and online file sharing. The MIR technique is basically designed for music data but can be extended to other types of audio information (<xref ref-type="bibr" rid="B15">Lartillot, 2014</xref>; <xref ref-type="bibr" rid="B5">Choi et al., 2017</xref>; <xref ref-type="bibr" rid="B21">Rumsey, 2009</xref>; <xref ref-type="bibr" rid="B6">Downie, 2003</xref>). Other psychoacoustic metrics have been developed in music and signal processing applied to music, taking into account several aspects of sound (tonal, temporal, rhythmic, harmonic, timbre, pitch, etc.). These psychoacoustic metrics constitute a dataset of descriptors for audio analysis in the field of information retrieval, a field that has received a lot of attention in recent years in the context of massive data and machine learning (<xref ref-type="bibr" rid="B24">Urbano and Serra, 2013</xref>).</p>
<p>The field of MIR is defined as the extraction of information from music and its applications. Since music refers to audio content, the scope of MIR extends to other types of music information, for example, lyrics, music metadata, or the user&#x2019;s listening history (<xref ref-type="bibr" rid="B5">Choi et al., 2017</xref>; <xref ref-type="bibr" rid="B6">Downie, 2003</xref>). MIR is the technology behind systems capable of searching, analyzing, and recommending audio content (<xref ref-type="bibr" rid="B21">Rumsey, 2009</xref>).</p>
<p>Despite the possibility of using this technique for the analysis of other non-musical sounds, there are no publications or applications that aim to study sound quality in industry using MIR. Therefore, this study aims to exploit and adapt MIR metric extraction software and libraries (cited above) to extract the key features of the sound signature of recreational vehicle sounds.</p>
<sec id="s2-1">
<title>2.1 Building predictive sound quality</title>
<p>Recently, sound quality assessment using subjective measures has focused on identifying sound quality metrics that can predict subjective responses. The goal is to design a numerical prediction model that can replace listening tests. In practice, it then becomes possible to predict the sound quality perception of a panel of representative users for a new sound or a new sound design.</p>
<p>The principle is to link the detailed explanation of the properties of the sound (subjective evaluation) with the psychoacoustic indicators of the stimuli used in listening tests (objective evaluation). Two types of approaches are used for the objective prediction of sound quality.</p>
<p>The first approach involves correlation and regression analyses using a pool of preselected metrics that can provide meaningful models for engineers. Most of the research reported in the literature on the creation of objective models of sound quality is based on the theory of multiple linear regression (<xref ref-type="bibr" rid="B19">Otto et al., 2001</xref>; <xref ref-type="bibr" rid="B14">Kwon et al., 2018</xref>; <xref ref-type="bibr" rid="B12">Jiang and Zeng, 2014</xref>).</p>
<p>The second approach leverages recent advancements in machine learning and deep learning. For instance, Huang et al. demonstrated that convolutional neural networks (CNN) can be used for the sound quality prediction of interior noise (<xref ref-type="bibr" rid="B11">Huang et al., 2020</xref>). Other neural networks have been applied to sound quality prediction, including back propagation neural networks (BPNN) (<xref ref-type="bibr" rid="B10">Huang et al., 2021</xref>), radial basis function (RBF) neural networks (<xref ref-type="bibr" rid="B27">Xiong et al., 2015</xref>), or even genetic algorithms (<xref ref-type="bibr" rid="B3">Chen et al., 2022</xref>). However, despite the promise of these approaches, their practical application in product design to improve sound quality perception remains challenging (<xref ref-type="bibr" rid="B16">Lee, 2008</xref>; <xref ref-type="bibr" rid="B20">Paulraj et al., 2013</xref>; <xref ref-type="bibr" rid="B25">Wang et al., 2014</xref>) because the integration of machine learning and neural network models into the product design process often requires extensive and high-quality training data, which may not always be available or easy to obtain.</p>
<p>This paper presents an attempt to overcome these polarized limitations by seeking a realistic and pragmatic in-between solution that can be used by NVH engineers without requiring extensive and high-quality training data.</p>
</sec>
<sec id="s2-2">
<title>2.2 Linear regression</title>
<p>The linear regression method is based on a least-squares (LS) approach that minimizes the prediction error. However, as with any classical LS solution to a problem with many potential predictors, all the predictor coefficients will be part of the solution, which can lead to overfitting. To address this issue and to produce a more parsimonious predictive model, more advanced methods adapted to the problem of sound quality have been developed (<xref ref-type="bibr" rid="B9">Gauthier et al., 2017</xref>). For instance, techniques such as regularization are used to simplify the model by performing a pseudo-inversion of the matrix of potential predictors, thereby selecting only the most relevant predictors.</p>
<p>Parsimonious models are preferred due to their simplicity, interpretability, and reduced risk of overfitting, allowing for a better understanding of data and more efficient, generalizable, and computationally manageable analyses. In this research work, the authors investigated parsimonious selection and extraction of sound quality/significance predictors using <italic>Lasso/Elastic-net</italic> (<xref ref-type="bibr" rid="B22">Tibshirani, 1996</xref>; <xref ref-type="bibr" rid="B29">Zou and Hastie, 2005</xref>) and <italic>Group-Lasso</italic> (<xref ref-type="bibr" rid="B23">Tibshirani and Taylor, 2011</xref>). The <italic>Lasso</italic> corresponds to a convex optimization problem with regularization of the 1-norm of the solution. The <italic>Elastic-net</italic> is a convex minimization problem with a weighted regularization of the 2-norm and 1-norm of the solution. Finally, the <italic>Group-Lasso</italic> is a structured parsimony approach that promotes inter-group parsimony via the 1-norm of the 2-norm of the (predefined) predictor groups (<xref ref-type="bibr" rid="B8">Friedman et al., 2010</xref>).</p>
<p>Despite their effectiveness in many applications, <italic>Lasso</italic> regressions, introduced by Tibshirani (<xref ref-type="bibr" rid="B22">Tibshirani, 1996</xref>), are known to have some limitations. Mainly, if there is a group of highly correlated predictors, the <italic>Lasso</italic> tends to select only one predictor from the group, arbitrarily. The <italic>Elastic-net</italic> approach proposed by Zou and Hastie (<xref ref-type="bibr" rid="B29">Zou and Hastie, 2005</xref>) is a variant of the <italic>Lasso</italic> regression. It improves the <italic>Lasso</italic> predictions and enhances the ability to do grouped selection. The <italic>Lasso</italic> and <italic>Elastic-net</italic> approaches used in this research work incorporate cross-validation steps, ensuring the selection of optimal models and reducing the risk of overfitting (see <xref ref-type="sec" rid="s3-2">Section 3.2</xref>). This cross-validation process enhances the reliability of the predictive models for sound quality assessment.</p>
</sec>
</sec>
<sec id="s3">
<title>3 Data and method</title>
<p>The objective models in this paper were built using listening test data from seven existing recreational vehicles, assessed across three driving conditions (idle, constant speed at 30&#xa0;km/h, acceleration from 0 to 60&#xa0;km/h), extensively detailed in a prior study (<xref ref-type="bibr" rid="B2">Benghanem et al., 2021</xref>). Given that SSVs typically operate at speeds below 30&#xa0;km/h for 95% of their operating time, and that acceleration reflects the sensation associated with vehicle sportiveness, the constant speed and acceleration conditions were chosen for constructing the objective models.</p>
<p>These models aim to predict scores from the constant speed and acceleration conditions, provided by twenty participants, on six sensory attributes (<italic>Aggressive</italic>, <italic>Noisy</italic>, <italic>Soft</italic>, <italic>Metallic</italic>, <italic>Powerful</italic>, <italic>Vibrating</italic>) rated from 0% to 100%. Additionally, the models also aim to predict <italic>Desire-to-buy</italic> scores and the first two principal components (PC1 and PC2) derived from Principal Component Analysis (PCA) of sensory attributes. As detailed in (<xref ref-type="bibr" rid="B2">Benghanem et al., 2021</xref>), PC1 reflects the perceived powerfulness of the vehicle (<italic>Metallic</italic>/<italic>Powerful</italic>), while PC2 represents the perceived softness (<italic>Aggressive</italic>/<italic>Soft</italic>). Collectively, PC1 and PC2 retain 69% of the total variance in the initial data for the constant speed condition (see <xref ref-type="fig" rid="F1">Figure 1</xref>) and 72% for the acceleration condition (see <xref ref-type="fig" rid="F2">Figure 2</xref>).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Loadings on the first two Principal Components of the sensory profile (PC1, PC2) for the constant speed condition. Reprinted from: &#x201c;Sound quality of side-by-side vehicles: Investigation of multidimensional sensory profiles and loudness equalization in an industrial context,&#x201d; by A. <xref ref-type="bibr" rid="B2">Benghanem et al. (2021)</xref> Acta Acustica, 5 (7), page 17. doi: 10.1051/aacus/2020032 publisher: EDP Sciences.</p>
</caption>
<graphic xlink:href="facou-02-1477395-g001.tif"/>
</fig>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Loadings on the first two Principal Components of the sensory profile (PC1, PC2) for the acceleration condition.</p>
</caption>
<graphic xlink:href="facou-02-1477395-g002.tif"/>
</fig>
<p>Data from the listening test were equalized in global loudness to avoid overestimating loudness in the predictions and to ensure a finer analysis of, for example, the timbre structure of the sound.</p>
<sec id="s3-1">
<title>3.1 Predictors</title>
<p>Two families of metrics were used as predictors: 1) physical and psychoacoustic metrics, hereafter referred to as engineering metrics, and 2) the metrics from the MIR (Music Information Retrieval) library used for the extraction of audio and musical characteristics from digital audio files. Among the engineering metrics, the global loudness in sone, the specific loudness on the Bark scale in the 24 frequency bands between 20&#xa0;Hz and 15,500&#xa0;Hz, the fluctuation strength, the sound pressure level in dB of the third-octave band spectrum in the 29 frequency bands between 20&#xa0;Hz and 16,000&#xa0;Hz, roughness and sharpness were chosen. The MIR metrics used in this research project come from the library <italic>MIRtoolbox</italic> 1.6.1 for Matlab (<xref ref-type="bibr" rid="B15">Lartillot, 2014</xref>). These metrics are grouped into categories: tonality, timbre, rhythm, dynamics, and pitch.</p>
<p>Three statistical variants of each of the metrics were calculated and used as predictors: the mean value over the time duration of the sound sample (Mean), the standard deviation (Std), and the slope over time (Slope). The slope is defined as the linear trend along frames, which is the derivative of the line that best fits the curve. Specifically, the slope <inline-formula id="inf1">
<mml:math id="m1">
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is computed using a normalized representation of the curve <inline-formula id="inf2">
<mml:math id="m2">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>&#x2014;centered, with unit variance, and scaled to a temporal series <inline-formula id="inf3">
<mml:math id="m3">
<mml:mrow>
<mml:mi>T</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> of values between 0 and 1. This is solved as a least-squares solution to the equation <inline-formula id="inf4">
<mml:math id="m4">
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mo>&#x2217;</mml:mo>
<mml:mi>T</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>C</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>. The choice of using such metrics is motivated by the need to include significant variables, such as the slope, for acceleration sounds (time-varying signals).</p>
<p>For the calculation of the metrics and their variants, the signal was decomposed into frames, with a frame length of 50&#xa0;ms and 50% overlap for the MIR metrics, and a 30&#xa0;ms frame length for the engineering metrics. This frame-based analysis enables the extraction of metrics that are representative of the signal&#x2019;s composition in both the time and spectral domains, ensuring an accurate capture of its characteristics.</p>
<p>Specific loudness and global loudness values were calculated according to the ISO 532B model for stationary sounds (<xref ref-type="bibr" rid="B31">Zwicker et al., 1991</xref>) (for constant speed and idle) and according to the model of (<xref ref-type="bibr" rid="B30">Zwicker and Fastl, 1999</xref>) for non-stationary sounds (acceleration). Also, the value of the sharpness of a sound, and the value of variable sharpness in time, were calculated according to the procedure proposed by Fastl (derived from Zwicker) with the correction of (<xref ref-type="bibr" rid="B1">Aures, 1985</xref>). A total of 182 metrics (engineering, MIR, including variants for non-stationary signals) were available in the bank of potential model candidates. The temporal variations of the metrics for stationary sounds (idle, constant speed) were then removed, resulting in a total of 127 metrics for these two stationary conditions.</p>
</sec>
<sec id="s3-2">
<title>3.2 Lasso and elastic-net</title>
<p>The linear model used to create sound quality models is defined in matrix form and indices:<disp-formula id="e1">
<mml:math id="m5">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:munderover>
</mml:mstyle>
<mml:msub>
<mml:mrow>
<mml:mi>F</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>b</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
<label>(1)</label>
</disp-formula>with <inline-formula id="inf5">
<mml:math id="m6">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> the ith component of the vector of scores obtained by listening test statistics (<inline-formula id="inf6">
<mml:math id="m7">
<mml:mrow>
<mml:mi>I</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> sounds), <inline-formula id="inf7">
<mml:math id="m8">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>F</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> the (i, m)th component of the matrix of metrics or scalar measures of <inline-formula id="inf8">
<mml:math id="m9">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> potential predictors for the <inline-formula id="inf9">
<mml:math id="m10">
<mml:mrow>
<mml:mi>I</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> sounds, <inline-formula id="inf10">
<mml:math id="m11">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> the coefficients to be solved as a vector (linear regression coefficients), <inline-formula id="inf11">
<mml:math id="m12">
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> the intercept (the score when all the coefficients <inline-formula id="inf12">
<mml:math id="m13">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are null) and <inline-formula id="inf13">
<mml:math id="m14">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> the prediction error for the ith sound. <xref ref-type="disp-formula" rid="e1">Equation 1</xref> can be solved using linear regression. In the case of <italic>wide data</italic> with far fewer observations than predictive metrics <inline-formula id="inf14">
<mml:math id="m15">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>I</mml:mi>
<mml:mo>&#x226a;</mml:mo>
<mml:mi>M</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, classical linear regression based on a least-squares approach will typically lead to overfitting and all the coefficients <inline-formula id="inf15">
<mml:math id="m16">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> will be nonzero. As mentioned in the introduction, this strongly limits the interpretation of the resulting model for any engineering use or design guidelines. The aim of the <italic>Lasso</italic> and <italic>Elastic-net</italic> is to circumvent this issue by rewriting the problem as a composite cost function (<xref ref-type="bibr" rid="B22">Tibshirani, 1996</xref>):<disp-formula id="e2">
<mml:math id="m17">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>J</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mi>I</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>I</mml:mi>
</mml:mrow>
</mml:munderover>
</mml:mstyle>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>b</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:munderover>
</mml:mstyle>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:msub>
<mml:mrow>
<mml:mi>F</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>&#x3bb;</mml:mi>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:munderover>
</mml:mstyle>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:mfrac>
<mml:msubsup>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
<mml:mo stretchy="false">&#x7c;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="false">&#x7c;</mml:mo>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
<label>(2)</label>
</disp-formula>
</p>
<p>The first right-hand side term corresponds to the quadratic sum of the predictor errors and the second right-hand side term is a regularization term with regularization amount <inline-formula id="inf16">
<mml:math id="m18">
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
<mml:mo>&#x3e;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>. The regularization combines 2-norm regularization <inline-formula id="inf17">
<mml:math id="m19">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> and 1-norm regularization <inline-formula id="inf18">
<mml:math id="m20">
<mml:mrow>
<mml:mo stretchy="false">&#x7c;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="false">&#x7c;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> based on the <italic>Elastic-net</italic> parameter <inline-formula id="inf19">
<mml:math id="m21">
<mml:mrow>
<mml:mn>0</mml:mn>
<mml:mo>&#x2264;</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
<mml:mo>&#x2264;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>. For the <italic>Lasso</italic>, <inline-formula id="inf20">
<mml:math id="m22">
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, only the 1-norm regularization is included. This induces solution sparsity, i.e., few coefficients <inline-formula id="inf21">
<mml:math id="m23">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> will be non-zero and will be therefore selected in the model (<xref ref-type="bibr" rid="B22">Tibshirani, 1996</xref>). The sparsity is controlled by the regularization amount <inline-formula id="inf22">
<mml:math id="m24">
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>. The <italic>Elastic-net</italic> (<xref ref-type="bibr" rid="B29">Zou and Hastie, 2005</xref>) involves <inline-formula id="inf23">
<mml:math id="m25">
<mml:mrow>
<mml:mn>0</mml:mn>
<mml:mo>&#x3c;</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
<mml:mo>&#x3c;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> and will typically smooth out the selection towards the extreme case of 2-norm-only regularization with <inline-formula id="inf24">
<mml:math id="m26">
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> (this corresponds to Tikhonov regularization). The minimum of the composite cost function cannot be found by analytical means since the 1-norm term is not differentiable at zero. Therefore, the minimization problem is solved iteratively using coordinate descent algorithms (<xref ref-type="bibr" rid="B26">Wright, 2015</xref>). In <xref ref-type="disp-formula" rid="e2">Equation 2</xref>, <inline-formula id="inf25">
<mml:math id="m27">
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is a user-selected parameter. Note that in the following, to create the simplest and most parsimonious models, only the <italic>Lasso</italic> results are shown <inline-formula id="inf26">
<mml:math id="m28">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>. The penalization amount <inline-formula id="inf27">
<mml:math id="m29">
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is set rigorously using the following procedure: The experimenter defines a limit on the maximum number of metrics that should be included in the model. Here, the aim is to make sure that the model is readable and meaningful for engineers who can later use it for product modification. Next, the problem is solved for a wide range of <inline-formula id="inf28">
<mml:math id="m30">
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> starting with the largest <inline-formula id="inf29">
<mml:math id="m31">
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> so that all coefficients <inline-formula id="inf30">
<mml:math id="m32">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are zero, and decreasing in successive iterations. The <inline-formula id="inf31">
<mml:math id="m33">
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> iteration stops if: 1) the maximum number of non-zero coefficients <inline-formula id="inf32">
<mml:math id="m34">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is reached or 2) the minimum prediction error is obtained for <inline-formula id="inf33">
<mml:math id="m35">
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>-fold cross-validation of the prediction. Cross-validation is used to avoid overfitting of the model. In this paper, the maximum number of predictive metrics is 7 and the cross-validation is 5-fold.</p>
<p>Cross-validation is a statistical technique used in machine learning and model evaluation. It involves dividing a dataset into subsets, typically a training set to build a predictive model and a validation set to assess its performance. This process is repeated multiple times, each time with a different subset as the validation set and the rest as the training set. The results are then averaged, providing a robust estimate of the model&#x2019;s performance, helping to mitigate overfitting, and ensuring the model&#x2019;s generalizability to unseen data. Cross-validation is crucial for selecting the best model and optimizing its hyperparameters while avoiding data leakage and providing a more accurate assessment of predictive performance.</p>
<p>Note that in this study, all seven sounds were retained for the training of the models. While this approach may limit our ability to test the predictive power of the models on new sounds, it is important to highlight that this was not a primary focus or requirement of the study. As a reminder, the main objective of this research is to develop simple objective models that can provide an objective understanding of the measured sounds of side-by-side vehicles. By including all available sounds in the training dataset, we aimed to capture the full range of sound characteristics and ensure a comprehensive analysis within the scope of this study.</p>
</sec>
</sec>
<sec sec-type="results" id="s4">
<title>4 Results</title>
<p>
<xref ref-type="table" rid="T1">Tables 1</xref>, <xref ref-type="table" rid="T2">2</xref> present the objective models derived from <italic>Lasso</italic> for the constant speed and the acceleration conditions, respectively, to predict each perceptual attribute (<italic>Powerful</italic>, <italic>Aggressive</italic>, <italic>Metallic</italic>, <italic>Soft</italic>, <italic>Vibrating</italic>, and <italic>Noisy</italic>), the overall <italic>Desire-to-Buy</italic>, and the two principal components of the six-dimension sensory profiles of recreational vehicle sounds. The description of the predictors selected in these models can be found in <xref ref-type="table" rid="T3">Table 3</xref>. <xref ref-type="fig" rid="F3">Figure 3</xref> presents, as an example, the listening test responses and the corresponding model predictions for the <italic>Powerful</italic> attribute for SSV sounds in the constant speed condition.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>
<italic>Lasso</italic> model results for the constant speed condition. The number of predictors selected from the 127 available metrics <inline-formula id="inf34">
<mml:math id="m36">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">Predictors</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> used to build the <italic>Lasso</italic> models is shown in the second column. The estimated coefficients <inline-formula id="inf35">
<mml:math id="m37">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> of each predictor are listed in parentheses. The description of the predictors can be found in <xref ref-type="table" rid="T3">Table 3</xref>.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center"/>
<th align="center">
<inline-formula id="inf36">
<mml:math id="m38">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">Predictors</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
<th align="center">Predictors&#x2019; name <inline-formula id="inf37">
<mml:math id="m39">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
<th align="center">Model <italic>p</italic>-value</th>
<th align="center">Model adjusted R-squared</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Powerful</td>
<td align="center">3</td>
<td align="center">N&#x2032; B4 (6.78); N&#x2032; B14 (&#x2212;3.02); L 3oct 4,000 (&#x2212;2.58)</td>
<td align="center">0.0152</td>
<td align="center">0.91</td>
</tr>
<tr>
<td align="left">Aggressive</td>
<td align="center">1</td>
<td align="center">Rolloff85 Std (&#x2212;12.36)</td>
<td align="center">0.0016</td>
<td align="center">0.86</td>
</tr>
<tr>
<td align="left">Metallic</td>
<td align="center">2</td>
<td align="center">N&#x2032; B5 (&#x2212;8.69); N&#x2032; B16 (5.01)</td>
<td align="center">0.0107</td>
<td align="center">0.84</td>
</tr>
<tr>
<td align="left">Soft</td>
<td align="center">2</td>
<td align="center">L 3oct 63 (3.53); Rolloff95 Slope (&#x2212;5.94)</td>
<td align="center">0.0005</td>
<td align="center">0.97</td>
</tr>
<tr>
<td align="left">Vibrating</td>
<td align="center">3</td>
<td align="center">L 3oct 200 (4.24); L 3oct 1,000 (&#x2212;3.14); Rhythm Attack Slope (&#x2212;4.35)</td>
<td align="center">0.0333</td>
<td align="center">0.85</td>
</tr>
<tr>
<td align="left">Noisy</td>
<td align="center">2</td>
<td align="center">Brightness Std (&#x2212;2.33); Rolloff85 Std (&#x2212;2.25)</td>
<td align="center">0.0011</td>
<td align="center">0.95</td>
</tr>
<tr>
<td align="left">Desire-to-Buy</td>
<td align="center">2</td>
<td align="center">N&#x2032; B17 (&#x2212;3.89); L 3oct 63 (4.45)</td>
<td align="center">0.0249</td>
<td align="center">0.88</td>
</tr>
<tr>
<td align="left">PC1</td>
<td align="center">2</td>
<td align="center">L 3oct 4,000 (1.02); Rolloff85 Std (0.78)</td>
<td align="center">0.0158</td>
<td align="center">0.81</td>
</tr>
<tr>
<td align="left">PC2</td>
<td align="center">2</td>
<td align="center">L 3oct 40 (&#x2212;0.47); Rolloff95 Slope (0.64)</td>
<td align="center">0.0062</td>
<td align="center">0.88</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>
<italic>Lasso</italic> model results for the acceleration condition. The number of predictors selected from the 127 available metrics <inline-formula id="inf38">
<mml:math id="m40">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">Predictors</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> used to build the <italic>Lasso</italic> models is shown in the second column. The estimated coefficients <inline-formula id="inf39">
<mml:math id="m41">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> of each predictor are listed in parentheses. The description of the predictors can be found in <xref ref-type="table" rid="T3">Table 3</xref>.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center"/>
<th align="center">
<inline-formula id="inf40">
<mml:math id="m42">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">Predictors</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
<th align="center">Predictors&#x2019; name <inline-formula id="inf41">
<mml:math id="m43">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
<th align="center">Model <italic>p</italic>-value</th>
<th align="center">Model adjusted R-squared</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Powerful</td>
<td align="center">1</td>
<td align="center">N&#x2032; B11 Slope (19.54)</td>
<td align="center">0.0005</td>
<td align="center">0.91</td>
</tr>
<tr>
<td align="left">Aggressive</td>
<td align="center">2</td>
<td align="center">N&#x2032; B11 Slope (4.22); N&#x2032; B12 Slope (13.18)</td>
<td align="center">0.0038</td>
<td align="center">0.91</td>
</tr>
<tr>
<td align="left">Metallic</td>
<td align="center">2</td>
<td align="center">Rolloff85 Mean (7.78); L 3oct 3,150 (7.70)</td>
<td align="center">0.0092</td>
<td align="center">0.86</td>
</tr>
<tr>
<td align="left">Soft</td>
<td align="center">2</td>
<td align="center">L 3oct 80 (2.90); Sharpness Std (&#x2212;3.43)</td>
<td align="center">0.0009</td>
<td align="center">0.95</td>
</tr>
<tr>
<td align="left">Vibrating</td>
<td align="center">1</td>
<td align="center">N&#x2032; B6 Slope (10.32)</td>
<td align="center">0.0026</td>
<td align="center">0.83</td>
</tr>
<tr>
<td align="left">Noisy</td>
<td align="center">1</td>
<td align="center">N&#x2032; B14 Std (5.61)</td>
<td align="center">0.0069</td>
<td align="center">0.76</td>
</tr>
<tr>
<td align="left">Desire-to-Buy</td>
<td align="center">2</td>
<td align="center">N&#x2032; B11 Slope (7.08); N&#x2032; B12 Slope (11.62)</td>
<td align="center">0.0288</td>
<td align="center">0.75</td>
</tr>
<tr>
<td align="left">PC1</td>
<td align="center">1</td>
<td align="center">N&#x2032; B11 Slope (1.54)</td>
<td align="center">0.0028</td>
<td align="center">0.83</td>
</tr>
<tr>
<td align="left">PC2</td>
<td align="center">2</td>
<td align="center">N&#x2032; B16 Std (0.59); Spectral Flatness Slope (0.70)</td>
<td align="center">0.0024</td>
<td align="center">0.93</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Description of the predictors used for constructing the <italic>Lasso</italic> models.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Metrics</th>
<th align="left">Descriptions</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">N&#x2032; B4</td>
<td align="left">Specific loudness in the 4th critical band (300&#xa0;Hz&#x2013;400&#xa0;Hz)</td>
</tr>
<tr>
<td align="left">N&#x2032; B5</td>
<td align="left">Specific loudness in the 5th critical band (400&#xa0;Hz&#x2013;510&#xa0;Hz)</td>
</tr>
<tr>
<td align="left">N&#x2032; B14</td>
<td align="left">Specific loudness in the 14th critical band (2,000&#xa0;Hz&#x2013;2,320&#xa0;Hz)</td>
</tr>
<tr>
<td align="left">N&#x2032; B16</td>
<td align="left">Specific loudness in the 16th critical band (2,700&#xa0;Hz&#x2013;3,150&#xa0;Hz)</td>
</tr>
<tr>
<td align="left">N&#x2032; B17</td>
<td align="left">Specific loudness in the 17th critical band (3,150&#xa0;Hz&#x2013;3,700&#xa0;Hz)</td>
</tr>
<tr>
<td align="left">L 3oct XX</td>
<td align="left">Sound pressure level in dB in the 1/3 octave band centered at XX Hz</td>
</tr>
<tr>
<td align="left">RolloffYY</td>
<td align="left">Corresponds to the frequency below which YY % of the total signal energy is contained (i.e., the cutoff frequency where the accumulated energy of the signal reaches YY % of its total value)</td>
</tr>
<tr>
<td align="left">Brightness</td>
<td align="left">Sound brightness</td>
</tr>
<tr>
<td align="left">Sharpness</td>
<td align="left">Sharpness of the sound (acuity)</td>
</tr>
<tr>
<td align="left">Spectral Flatness</td>
<td align="left">Also known as Wiener entropy, which is a measure of the width and uniformity of the power spectrum</td>
</tr>
<tr>
<td align="left">Rhythm Attack Slope</td>
<td align="left">Ratio between the difference in magnitude at the beginning and end of the attack period, and the corresponding time difference</td>
</tr>
<tr>
<td align="left">Slope, Mean, Std</td>
<td align="left">Statistics (over time): Slope, Mean, and Standard Deviation respectively</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Responses and prediction of responses of the <italic>Powerful</italic> attribute for SSV sounds for constant speed condition. The thick bars (in blue) indicate the responses and the thinner bars (in red) indicate the model predictions. The horizontal axis labels (V1, V2, etc.) correspond to individual vehicles. The model&#x2019;s fit, represented by the coefficient of determination <inline-formula id="inf42">
<mml:math id="m44">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0.96</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, is shown in the legend.</p>
</caption>
<graphic xlink:href="facou-02-1477395-g003.tif"/>
</fig>
<sec id="s4-1">
<title>4.1 Models&#x2019; prediction for the constant speed condition</title>
<p>As can be seen in <xref ref-type="table" rid="T1">Table 1</xref>, the <italic>Lasso</italic> models were able to predict the <italic>Powerful</italic> attribute with a coefficient of determination of 91% using only three predictors, the <italic>Aggressive</italic> attribute with a coefficient of determination of 86% using only one predictor, the <italic>Metallic</italic> attribute with a coefficient of determination of 84% using only two predictors, the <italic>Soft</italic> attribute with a coefficient of determination of 97% using only two predictors, the <italic>Vibrating</italic> attribute with a coefficient of determination of 85% using only three predictors, the <italic>Noisy</italic> attribute with a coefficient of determination of 95% using only two predictors, and the overall <italic>Desire-to-Buy</italic> with a coefficient of determination of 88% using only two predictors. The models derived from <italic>Lasso</italic> were also able to predict the average scores of PC1 with a coefficient of determination of 81% with only two predictors, and the average scores of PC2 with a coefficient of determination of 88% with only two predictors. All predictors were selected by the <italic>Lasso</italic> algorithm, which identifies the most relevant metrics (i.e., those that minimize prediction error) from the 127 available, with a maximum of three metrics per model.</p>
<p>The high adjusted coefficients of determination (adjusted <inline-formula id="inf43">
<mml:math id="m45">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>) and low <italic>p</italic>-values indicate that each of these models can be considered statistically reliable. Based on the models&#x2019; estimated coefficients, the following conclusions can be drawn regarding the constant speed condition:<list list-type="simple">
<list-item>
<p>
<inline-formula id="inf44">
<mml:math id="m46">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <italic>Powerful</italic> attribute: the specific loudness of Bark 4 positively impacts this model, while the specific loudness of Bark 14 and the level (dB) per 1/3 octave band of the 4,000&#xa0;Hz band (3,548&#xa0;Hz&#x2013;4,467&#xa0;Hz) negatively impact it. This means that 1) an increase in the energy in this low-frequency range (Bark 4) makes the sound feel more powerful and robust, 2) excessive energy in this higher frequency range (Bark 14) can make the sound feel less powerful, and 3) higher levels of energy in the 4,000&#xa0;Hz band can reduce the overall sense of power.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf45">
<mml:math id="m47">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <italic>Aggressive</italic> attribute: the standard deviation (over time) of the frequency below which 85% of the total energy of the spectrum is contained negatively impacts this model, suggesting that less variation in high-frequency energy correlates with a more aggressive perception of the sound.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf46">
<mml:math id="m48">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <italic>Metallic</italic> attribute: the specific loudness values of Bark 5 and Bark 16 have opposite impacts on this model. Specifically, to sound more metallic, an SSV sound should have less energy in the Bark 5 band and more energy in the Bark 16 band.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf47">
<mml:math id="m49">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <italic>Soft</italic> attribute: the level in dB of the band centered at 63&#xa0;Hz (56.2&#xa0;Hz&#x2013;70.8&#xa0;Hz) positively impacts this model, while the slope (over time) of the frequency below which 95% of the total energy of the spectrum is contained negatively impacts it. This suggests that higher energy content in the 56.2&#xa0;Hz&#x2013;70.8&#xa0;Hz band and a lower Rolloff95 slope correlate with a softer sound.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf48">
<mml:math id="m50">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <italic>Vibrating</italic> attribute: the level in dB of the third-octave band centered at 200&#xa0;Hz (178&#xa0;Hz&#x2013;224&#xa0;Hz) positively impacts this model, while the dB level of the band centered at 1,000&#xa0;Hz (891&#xa0;Hz&#x2013;1,122&#xa0;Hz) and the slope of the rhythm attack negatively impact it. This suggests that a higher energy content in the 178&#xa0;Hz&#x2013;224&#xa0;Hz band, a lower energy content in the 891&#xa0;Hz&#x2013;1,122&#xa0;Hz band, and a lower slope of attack (lower slope of transient events in the signal, i.e., reduced increase of transient events with time) correlate with a more vibrating sound.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf49">
<mml:math id="m51">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <italic>Noisy</italic> attribute: both the standard deviation of the brightness (variation of brightness over time) and the standard deviation (over time) of the frequency below which 85% of the total energy of the spectrum is contained negatively impact this model. This suggests that lower variation (over time) of the energy in the mid- and high-frequency ranges correlates with a noisier sound.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf50">
<mml:math id="m52">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <italic>Desire-to-Buy</italic>: the specific loudness of the Bark 17 band (3,150&#xa0;Hz&#x2013;3,700&#xa0;Hz) negatively impacts this model, while the level in dB of the band centered at 63&#xa0;Hz (56.2&#xa0;Hz&#x2013;70.8&#xa0;Hz) positively impacts it. This suggests an incentive to design SSVs with a sound signature with more emphasis on low frequencies, as these frequencies contribute positively to the desire-to-buy score.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf51">
<mml:math id="m53">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> PC1: both the level in dB of the band centered at 4,000&#xa0;Hz (3,548&#xa0;Hz&#x2013;4,467&#xa0;Hz) and the standard deviation of the spectral Rolloff85 metric positively impact this model. It is noteworthy that these two metrics are also selected by <italic>Lasso</italic> in the models for the <italic>Powerful</italic> and <italic>Aggressive</italic> attributes.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf52">
<mml:math id="m54">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> PC2: the level in dB of the band centered at 40&#xa0;Hz (35.5&#xa0;Hz&#x2013;44.7&#xa0;Hz) negatively impacts this model, while the slope of the spectral Rolloff95 positively impacts it.</p>
</list-item>
</list>
</p>
</sec>
<sec id="s4-2">
<title>4.2 Models&#x2019; prediction for the acceleration condition</title>
<p>As can be seen in <xref ref-type="table" rid="T2">Table 2</xref>, the <italic>Lasso</italic> models were able to predict the <italic>Powerful</italic> attribute with a coefficient of determination of 91% using only one predictor, the <italic>Aggressive</italic> attribute with a coefficient of determination of 91% using only two predictors, the <italic>Metallic</italic> attribute with a coefficient of determination of 86% using only two predictors, the <italic>Soft</italic> attribute with a coefficient of determination of 95% using only two predictors, the <italic>Vibrating</italic> attribute with a coefficient of determination of 83% using only one predictor, the <italic>Noisy</italic> attribute with a coefficient of determination of 76% using only one predictor, and the overall <italic>Desire-to-Buy</italic> with a coefficient of determination of 75% using only two predictors. The models derived from <italic>Lasso</italic> were also able to predict the average scores of PC1 with a coefficient of determination of 83% with only one predictor, and the average scores of PC2 with a coefficient of determination of 93% with only two predictors. Here again, all predictors were selected by the <italic>Lasso</italic> algorithm, which identifies the most relevant metrics (i.e., those that minimize prediction error) from the 127 available, with a maximum of three metrics per model.</p>
<p>The high adjusted coefficients of determination (adjusted <inline-formula id="inf53">
<mml:math id="m55">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>) and low <italic>p</italic>-values indicate that each of these models can be considered statistically reliable. Based on the models&#x2019; estimated coefficients, the following conclusions can be drawn regarding the acceleration condition:<list list-type="simple">
<list-item>
<p>
<inline-formula id="inf54">
<mml:math id="m56">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <italic>Powerful</italic> attribute: the slope (over time) of the specific loudness of Bark 11 positively impacts this model. This suggests that a steady increase over time in the energy of this mid-frequency band (Bark 11) contributes to a more powerful and dynamic perception of the sound during acceleration.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf55">
<mml:math id="m57">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <italic>Aggressive</italic> attribute: the slope (over time) of the specific loudness of both Bark bands 11 and 12 positively impacts this model. This implies that a steady increase in the energy in these two Bark bands makes the sound of acceleration feel more aggressive.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf56">
<mml:math id="m58">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <italic>Metallic</italic> attribute: both the mean of the frequency below which 85% of the total energy of the spectrum is contained and the level in dB of the third-octave band centered at 3,150&#xa0;Hz positively impact this model.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf57">
<mml:math id="m59">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <italic>Soft</italic> attribute: the standard deviation (over time) of the sharpness negatively impacts this model, while the level in dB of the third-octave band centered at 80&#xa0;Hz (70.8 Hz&#x2013;89.1&#xa0;Hz) positively impacts it. This suggests that a stable sharpness and a pronounced low-frequency content in the 80&#xa0;Hz band lead to a softer perception of the acceleration sound.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf58">
<mml:math id="m60">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <italic>Vibrating</italic> attribute: the slope (over time) of the specific loudness of Bark 6 positively impacts this model. This suggests that a steady increase in the energy of the Bark 6 band will make the sound of acceleration feel more vibrating.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf59">
<mml:math id="m61">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <italic>Noisy</italic> attribute: the standard deviation (over time) of the specific loudness of Bark 14 positively impacts this model. This implies that greater variation in the loudness of the Bark 14 band correlates with a noisier perception of the acceleration sound.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf60">
<mml:math id="m62">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> <italic>Desire-to-buy</italic>: the slope (over time) of the specific loudness of both Bark 11 and 12 positively impacts this model. Notably, these two metrics are also selected by <italic>Lasso</italic> in the models for the <italic>Powerful</italic> and <italic>Aggressive</italic> attributes, suggesting that the sound signature of an SSV&#x2019;s acceleration should &#x201c;sound&#x201d; more <italic>Powerful</italic> and <italic>Aggressive</italic> to increase the desire to purchase.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf61">
<mml:math id="m63">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> PC1: the slope (over time) of the specific loudness of Bark 11 positively impacts this model.</p>
</list-item>
<list-item>
<p>
<inline-formula id="inf62">
<mml:math id="m64">
<mml:mrow>
<mml:mo>&#x2022;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> PC2: both the standard deviation (over time) of the specific loudness of Bark 16 and the slope of the spectral flatness positively impact this model.</p>
</list-item>
</list>
</p>
</sec>
<sec id="s4-3">
<title>4.3 Interpretation of models</title>
<p>In this study, we were also interested in conveying the meaning of the objective models in a simple way, using a holistic visual representation.</p>
<p>To this end, <xref ref-type="fig" rid="F4">Figures 4</xref>, <xref ref-type="fig" rid="F5">5</xref> present a summary of the sound signature and sound quality models for the constant speed and the acceleration conditions, respectively. These figures provide a visual illustration of the different models for predicting the sound signature and sound quality of SSVs with the metrics selected in each model. These figures also show the effectiveness of the <italic>Lasso</italic> in selecting only a few metrics to build these parsimonious models from a large metric bank.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Objective models of SSV sounds for constant speed condition. The colors are associated with the attributes to be predicted. The area of each metric (represented by a rectangle) is relative to its contribution (or coefficient <inline-formula id="inf63">
<mml:math id="m65">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>) in the model. The description of metrics can be found in <xref ref-type="table" rid="T3">Table 3</xref>. Rectangles are ordered from largest to smallest from left to right and from top to bottom. A minus sign <inline-formula id="inf64">
<mml:math id="m66">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> is shown in front of metrics that have a negative coefficient in the model.</p>
</caption>
<graphic xlink:href="facou-02-1477395-g004.tif"/>
</fig>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Objective models of SSV sounds for acceleration condition. The colors are associated with the attributes to be predicted. The area of each metric (represented by a rectangle) is relative to its contribution (or coefficient <inline-formula id="inf65">
<mml:math id="m67">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>) in the model. The description of metrics can be found in <xref ref-type="table" rid="T3">Table 3</xref>. Rectangles are ordered from largest to smallest from left to right and from top to bottom. A minus sign <inline-formula id="inf66">
<mml:math id="m68">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> is shown in front of metrics that have a negative coefficient in the model.</p>
</caption>
<graphic xlink:href="facou-02-1477395-g005.tif"/>
</fig>
<p>From the models developed in this paper, it is now possible to retrieve the sound signature and sound quality of current SSVs and predict those of sounds measured on new SSVs or with virtually modified sounds. However, comparing vehicles based on all these models (all metrics in all three conditions) is likely to be confusing. Therefore, to simplify this, i.e., to make it easier to grasp the contribution of each metric and to compare between sounds, we created a tool named &#x201c;attribute wheel of SSVs.&#x201d; This tool allows one to easily visualize the different metrics, their contributions, the corresponding perceptual attributes, and the operating conditions for a given vehicle. It is typically read from the center to the circumference. This wheel of attributes is equivalent to the wine aroma wheel (<xref ref-type="bibr" rid="B18">Noble et al., 1987</xref>). As an example, <xref ref-type="fig" rid="F6">Figure 6</xref> shows the attribute wheel for the second vehicle (named V2 hereafter). The attribute wheel has three levels (the three circular rings in <xref ref-type="fig" rid="F6">Figure 6</xref>):<list list-type="simple">
<list-item>
<p>1. The operational conditions are represented by three different categories: Constant speed (Cst speed), idle, and acceleration. Note that models for the idle condition are not reported in this paper.</p>
</list-item>
<list-item>
<p>2. The scores of the attributes and the <italic>Desire-to-buy</italic>, represented by the areas of sectors for each attribute. The score values are ordered clockwise from the largest to the smallest value for each condition.</p>
</list-item>
<list-item>
<p>3. The objective metrics retained in the sparse models, represented by sectors of the outer ring. Each attribute is subdivided by the number of retained metrics in the model using the metric coefficients as bin sizes. A minus sign in the metric indicates a negative coefficient of this metric in the model.</p>
</list-item>
</list>
</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Wheel of attributes for vehicle V2. The attribute scores are ordered for each driving condition from largest to smallest in a clockwise direction. Starting at the center ring with the conditions, we move towards the outer rings, with attributes in the second ring and metrics in the last ring. The size of each metric is relative to its contribution in the model. The description of metrics can be found in <xref ref-type="table" rid="T3">Table 3</xref>. In the third ring, the colors assigned to the metrics do not carry any specific meaning. They are solely added to differentiate between the metrics visually. The purpose of using different colors is to aid in the visual distinction and organization of the metrics within the model. It is important to note that the colors do not convey any additional information or signify any particular significance or relationship among the metrics.</p>
</caption>
<graphic xlink:href="facou-02-1477395-g006.tif"/>
</fig>
<p>For instance, for the acceleration condition of V2, shown in <xref ref-type="fig" rid="F6">Figure 6</xref>, the <italic>Aggressive</italic> attribute has the largest score compared to the other attributes. The <italic>Aggressive</italic> objective model involves the two metrics N&#x2032; B12 Slope and N&#x2032; B11 Slope. These two metrics are the band-specific loudness slopes of Bark bands 12 and 11 (together covering 1,270&#xa0;Hz&#x2013;1,720&#xa0;Hz), respectively. This result suggests that the aggressiveness of the acceleration sound is predicted by the time variation of the spectral content in these two Bark bands. The graph also suggests that the effect of the N&#x2032; B12 Slope predictor is much larger than that of the N&#x2032; B11 Slope predictor in the model. The graph also shows that the same two metrics are involved in the <italic>Desire-to-buy</italic> objective model for this condition. Therefore, any positive variation in these two metrics will result in positive variations of the <italic>Aggressive</italic> attribute and <italic>Desire-to-buy</italic>. The inclusion of <italic>Desire-to-buy</italic> as one of the perceptual attributes in <xref ref-type="fig" rid="F6">Figure 6</xref> may seem odd. Specifically, in the idle condition, the features selected for the <italic>Desire-to-buy</italic> model do not match those of any of the perceptual attribute models. However, it should be noted that the idle condition may not be as critical in influencing the overall &#x201c;desire to purchase&#x201d; factor as the acceleration condition. Interestingly, in the acceleration condition, the two parameters used in the <italic>Desire-to-buy</italic> model are identical to those of the <italic>Aggressive</italic> perceptual attribute. This observation suggests a potential correlation between the perception of aggressiveness and the <italic>Desire-to-buy</italic> during acceleration, which could be a valuable element for further study.</p>
</sec>
</sec>
<sec sec-type="discussion" id="s5">
<title>5 Discussion</title>
<p>The results show that the <italic>Lasso</italic> can select a few significant metrics from a large bank of metrics for the objective models of subjective assessments of SSV sounds. Indeed, when generating models (of sensory profiles, sound quality, and principal components of the sensory attributes), the <italic>Lasso</italic> retained only one, two, or three predictors at most in each model from a list of 127 potential predictors (182 predictors for rapid acceleration), leading to parsimonious and easily understandable models.</p>
<p>Overall, the objective model for <italic>Desire-to-buy</italic> suggests designing SSVs with a sound signature that emphasizes low frequencies. Also, since the acceleration condition (non-stationary signals) is important for the global sound quality of SSVs, the objective models should include time variation properties of the related signals and not just the time-averaged values.</p>
<p>For the reported data, the constructed models have good consistency and statistical significance. However, since the number of samples in the cross-validation data was small, the significance of these models for new sounds (samples that are distinct from the sounds used in the listening tests) needs to be investigated.</p>
<p>In this study, we also propose a graphical visualization tool (attribute wheel of SSVs) to easily interpret the objective models of the sound signature and sound quality of SSVs. For instance, on practical grounds, this resulted in useful indications for sound quality optimization and for adjusting the sound signature of the SSVs for the industrial partner, which pursues the continuous improvement of the sound of its SSVs.</p>
</sec>
<sec sec-type="conclusion" id="s6">
<title>6 Conclusion</title>
<p>The goal of this study was to develop objective models of subjective assessments of SSV sounds. The applications of these models are, first, the prediction of the sound quality of side-by-side vehicles (SSVs), and second, the explanation of the underlying structure of the perceived sound quality of SSVs to guide engineers in future designs (e.g., increase this sound or reduce the brightness). This paper has provided a set of experimental results that allow a better understanding of the sensory profiles and sound quality of SSVs using physical and psychoacoustic metrics. When generating the models, the <italic>Lasso</italic> retained only a few significant metrics in each model from a large number of potential predictors, which led to parsimonious and easily interpretable models. In addition, a graphical tool for visualizing the metrics, named &#x201c;attribute wheel of SSVs,&#x201d; was developed as part of this study. It facilitates the interpretation of the contributions of metrics in models on the overall sound quality of SSVs. This has led to useful insights for sound quality optimization and for adjusting the sound signature of SSVs in general and the studied vehicle in particular. Using such illustrations and models, acoustic engineers from the SSV manufacturer can adjust future designs for a stronger desirability or a better sensory profile of SSVs.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s7">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="s8">
<title>Ethics statement</title>
<p>The studies involving humans were approved by CER Lettres et sciences humaines, Universit&#xe9; de Sherbrooke. The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p>
</sec>
<sec id="s9">
<title>Author contributions</title>
<p>AB: Conceptualization, Data curation, Formal Analysis, Investigation, Methodology, Project administration, Resources, Software, Validation, Visualization, Writing&#x2013;original draft, Writing&#x2013;review and editing. OV: Conceptualization, Data curation, Formal Analysis, Investigation, Methodology, Project administration, Resources, Software, Validation, Visualization, Writing&#x2013;original draft, Writing&#x2013;review and editing. P-AG: Conceptualization, Funding acquisition, Project administration, Supervision, Writing&#x2013;original draft, Writing&#x2013;review and editing. AB: Conceptualization, Funding acquisition, Project administration, Supervision, Writing&#x2013;original draft, Writing&#x2013;review and editing.</p>
</sec>
<sec sec-type="funding-information" id="s10">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. The authors wish to acknowledge the financial support from the &#x201c;Natural Sciences and Engineering Research Council of Canada&#x201d; (NSERC), &#x201c;Bombardier Recreational Products&#x201d; (BRP) and the &#x201c;Centre de Technologies Avanc&#xe9;es BRP-UdeS&#x201d; (CTA).</p>
</sec>
<ack>
<p>The authors wish to acknowledge the technical support provided by the members of the dXBel project. The authors would like to thank Paul Mass&#xe9; from the BRP marketing group for moderating the group discussions and for his support as well as all participants who completed the subjective experiments described in this paper. The data collection with human subjects was approved by the ethical committee <italic>C&#xc9;R - Lettres et sciences humaines</italic> of Universit&#xe9; de Sherbrooke (&#x23;2017-1546).</p>
</ack>
<sec sec-type="COI-statement" id="s11">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s12">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Aures</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>1985</year>). <article-title>&#x2018;Berechnungsverfahren f&#xfc;r den sensorischen Wohlklang beliebiger Schallsignale&#x2019; (A model for calculating the sensory euphony of various sounds)</article-title>. <source>Acustica</source> <volume>59</volume>.</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Benghanem</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Valentin</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Gauthier</surname>
<given-names>P.-A.</given-names>
</name>
<name>
<surname>Berry</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Sound quality of side-by-side vehicles: Investigation of multidimensional sensory profiles and loudness equalization in an industrial context</article-title>. <source>Acta Acust.</source> <volume>5</volume>, <fpage>7</fpage>. <comment>Publisher: EDP Sciences</comment>. <pub-id pub-id-type="doi">10.1051/aacus/2020032</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Shang</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Research on prediction model of tractor sound quality based on genetic algorithm</article-title>. <source>Appl. Acoust.</source> <volume>185</volume>, <fpage>108411</fpage>. <pub-id pub-id-type="doi">10.1016/j.apacoust.2021.108411</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Vehicle interior sound quality analysis by using grey relational analysis</article-title>. <source>SAE Int. J. Passeng. Cars Mech. Syst.</source> <volume>7</volume>, <fpage>355</fpage>&#x2013;<lpage>366</lpage>. <pub-id pub-id-type="doi">10.4271/2014-01-1976</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Choi</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Fazekas</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Cho</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Sandler</surname>
<given-names>M. B.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>A tutorial on deep learning for music information retrieval</article-title>. <source>CoRR</source> <volume>abs/1709.04396</volume>.</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Downie</surname>
<given-names>J. S.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Music information retrieval</article-title>. <source>Annu. Rev. Inf. Sci. Technol.</source> <volume>37</volume>, <fpage>295</fpage>&#x2013;<lpage>340</lpage>. <pub-id pub-id-type="doi">10.1002/aris.1440370108</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Fastl</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zwicker</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2007</year>). <source>Psychoacoustics: facts and models</source>. <edition>3rd Edn</edition>. <series>Springer Series in Information Sciences, Vol. 22</series>. <publisher-loc>Berlin and Heidelberg</publisher-loc>: <publisher-name>Springer</publisher-name>.</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Friedman</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hastie</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tibshirani</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>A note on the group lasso and a sparse group lasso</article-title>. <source>arXiv preprint arXiv:1001.0736</source>.
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gauthier</surname>
<given-names>P.-A.</given-names>
</name>
<name>
<surname>Scullion</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Berry</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Sound quality prediction based on systematic metric selection and shrinkage: comparison of stepwise, lasso, and elastic-net algorithms and clustering preprocessing</article-title>. <source>J. Sound Vib.</source> <volume>400</volume>, <fpage>134</fpage>&#x2013;<lpage>153</lpage>. <pub-id pub-id-type="doi">10.1016/j.jsv.2017.03.025</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Pure electric vehicle nonstationary interior sound quality prediction based on deep CNNs with an adaptable learning rate tree</article-title>. <source>Mech. Syst. Signal Process.</source> <volume>148</volume>, <fpage>107170</fpage>. <pub-id pub-id-type="doi">10.1016/j.ymssp.2020.107170</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Sound quality prediction and improving of vehicle interior noise based on deep convolutional neural networks</article-title>. <source>Expert Syst. Appl.</source> <volume>160</volume>, <fpage>113657</fpage>. <pub-id pub-id-type="doi">10.1016/j.eswa.2020.113657</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zeng</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Subjective and objective quantificational description of vehicle interior noise during acceleration</article-title>. <source>Appl. Mech. &#x26; Mater.</source> <volume>518</volume>, <fpage>297</fpage>&#x2013;<lpage>302</lpage>. <pub-id pub-id-type="doi">10.4028/www.scientific.net/amm.518.297</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>T. G.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>S.-K.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>H. H.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Characterization and quantification of luxury sound quality in premium-class passenger cars</article-title>. <source>Proc. Institution Mech. Eng. &#x2013; Part D &#x2013; J. Automob. Eng.</source> <volume>223</volume>, <fpage>343</fpage>&#x2013;<lpage>353</lpage>. <pub-id pub-id-type="doi">10.1243/09544070jauto989</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kwon</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Jo</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Kang</surname>
<given-names>Y. J.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Model of psychoacoustic sportiness for vehicle interior sound: excluding loudness</article-title>. <source>Appl. Acoust.</source> <volume>136</volume>, <fpage>16</fpage>&#x2013;<lpage>25</lpage>. <pub-id pub-id-type="doi">10.1016/j.apacoust.2018.01.027</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Lartillot</surname>
<given-names>O.</given-names>
</name>
</person-group> (<year>2014</year>). <source>
<italic>MIRtoolbox 1.6.1</italic>. User&#x2019;s manual</source>. <publisher-loc>Denmark</publisher-loc>: <publisher-name>Aalborg University</publisher-name>.</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>S.-K.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Objective evaluation of interior sound quality in passenger cars during acceleration</article-title>. <source>J. Sound Vib.</source> <volume>310</volume>, <fpage>149</fpage>&#x2013;<lpage>168</lpage>. <pub-id pub-id-type="doi">10.1016/j.jsv.2007.07.073</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lyon</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>An introduction to sound quality</article-title>. <source>J. Sound Vib.</source> <volume>6</volume>, <fpage>6</fpage>.</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Noble</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Arnold</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Buechsenstein</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Leach</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Schmidt</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Stern</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>1987</year>). <article-title>Modification of a standardized system of wine aroma terminology</article-title>. <source>Am. J. Enol. Vitic.</source> <volume>38</volume>, <fpage>143</fpage>&#x2013;<lpage>146</lpage>. <pub-id pub-id-type="doi">10.5344/ajev.1987.38.2.143</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Otto</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Amman</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Eaton</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Lake</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2001</year>) &#x201c;<article-title>Guidelines for jury evaluations of automotive sounds</article-title>,&#x201d; in <source>Sound and vibration</source>, <fpage>1</fpage>&#x2013;<lpage>14</lpage>.</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Paulraj</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Melvin</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Sazali</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Car cabin interior noise classification using temporal composite features and probabilistic neural network model</article-title>. <source>Appl. Mech. Mater.</source> <volume>471</volume>, <fpage>64</fpage>&#x2013;<lpage>68</lpage>. <pub-id pub-id-type="doi">10.4028/www.scientific.net/amm.471.64</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rumsey</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Searching, analyzing, and recommending audio content</article-title>. <source>J. Audio Eng. Soc.</source> <volume>57</volume>, <fpage>166</fpage>&#x2013;<lpage>169</lpage>.</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tibshirani</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>1996</year>). <article-title>Regression shrinkage and selection via the lasso</article-title>. <source>J. R. Stat. Soc. Ser. B Methodol.</source> <volume>58</volume>, <fpage>267</fpage>&#x2013;<lpage>288</lpage>. <pub-id pub-id-type="doi">10.1111/j.2517-6161.1996.tb02080.x</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tibshirani</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Taylor</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>The solution path of the generalized lasso</article-title>. <source>Ann. Statistics</source> <volume>39</volume>, <fpage>1335</fpage>&#x2013;<lpage>1371</lpage>. <pub-id pub-id-type="doi">10.1214/11-aos878</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Urbano</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Schedl</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Serra</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Evaluation in music information retrieval</article-title>. <source>J. Intell. Inf. Syst.</source> <volume>41</volume>, <fpage>345</fpage>&#x2013;<lpage>369</lpage>. <pub-id pub-id-type="doi">10.1007/s10844-013-0249-4</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Xing</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>A sound quality model for objective synthesis evaluation of vehicle interior noise based on artificial neural network</article-title>. <source>Mech. Syst. Signal Process.</source> <volume>45</volume>, <fpage>255</fpage>&#x2013;<lpage>266</lpage>. <pub-id pub-id-type="doi">10.1016/j.ymssp.2013.11.001</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wright</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Coordinate descent algorithms</article-title>. <source>Math. Program.</source> <volume>151</volume>, <fpage>3</fpage>&#x2013;<lpage>34</lpage>. <pub-id pub-id-type="doi">10.1007/s10107-015-0892-3</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiong</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Bao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chiong</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Forecasting interval time series using a fully complex-valued RBF neural network with DPSO and PSO algorithms</article-title>. <source>Inf. Sci.</source> <volume>305</volume>, <fpage>77</fpage>&#x2013;<lpage>92</lpage>. <pub-id pub-id-type="doi">10.1016/j.ins.2015.01.029</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Zhekova</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2007</year>). <source>Analyse temps-fr&#xe9;quence et synth&#xe8;se granulaire des bruits moteur diesel au ralenti: Application pour &#xe9;tude perceptive dans le contexte des sc&#xe8;nes auditives</source>. <publisher-loc>Marseille, France</publisher-loc>.</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zou</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Hastie</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Regularization and variable selection via the elastic net</article-title>. <source>J. R. Stat. Soc. Ser. B Stat. Methodol.</source> <volume>67</volume>, <fpage>301</fpage>&#x2013;<lpage>320</lpage>. <pub-id pub-id-type="doi">10.1111/j.1467-9868.2005.00503.x</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Zwicker</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Fastl</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>1999</year>). <source>Psychoacoustics: facts and models</source>. <edition>2nd Edn</edition>. <publisher-loc>Berlin</publisher-loc>: <publisher-name>Springer-Verlag</publisher-name>.</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zwicker</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Fastl</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Widmann</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Kurakata</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Kuwano</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Namba</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>1991</year>). <article-title>Program for calculating loudness according to DIN 45631 (ISO 532B)</article-title>. <source>J. Acoust. Soc. Jpn. (E)</source> <volume>12</volume>, <fpage>39</fpage>&#x2013;<lpage>42</lpage>. <pub-id pub-id-type="doi">10.1250/ast.12.39</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>